mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 12:24:53 +00:00
fix: adjust protos and router
This commit is contained in:
parent
ffc228831c
commit
8413cc45ec
@ -45,7 +45,7 @@ pub async fn run(
|
|||||||
repetition_penalty: repetition_penalty.unwrap_or(1.0),
|
repetition_penalty: repetition_penalty.unwrap_or(1.0),
|
||||||
frequency_penalty: frequency_penalty.unwrap_or(0.0),
|
frequency_penalty: frequency_penalty.unwrap_or(0.0),
|
||||||
watermark,
|
watermark,
|
||||||
fsm_grammar_state: Vec::new(),
|
fsm_grammar_state: 0,
|
||||||
};
|
};
|
||||||
|
|
||||||
// Initialize terminal properties
|
// Initialize terminal properties
|
||||||
|
@ -71,9 +71,9 @@ message NextTokenChooserParameters {
|
|||||||
/// token watermarking using "A Watermark for Large Language Models"
|
/// token watermarking using "A Watermark for Large Language Models"
|
||||||
bool watermark = 8;
|
bool watermark = 8;
|
||||||
/// grammar (applied if not empty)
|
/// grammar (applied if not empty)
|
||||||
repeated string grammar = 10;
|
string grammar = 10;
|
||||||
/// fsm_grammar_state
|
/// fsm_grammar_state
|
||||||
repeated uint32 fsm_grammar_state = 11;
|
uint32 fsm_grammar_state = 11;
|
||||||
}
|
}
|
||||||
|
|
||||||
message StoppingCriteriaParameters {
|
message StoppingCriteriaParameters {
|
||||||
|
@ -128,8 +128,8 @@ impl Client {
|
|||||||
repetition_penalty: 1.2,
|
repetition_penalty: 1.2,
|
||||||
frequency_penalty: 0.1,
|
frequency_penalty: 0.1,
|
||||||
watermark: true,
|
watermark: true,
|
||||||
grammar: Vec::new(),
|
grammar: String::new(),
|
||||||
fsm_grammar_state: Vec::new(),
|
fsm_grammar_state: 0,
|
||||||
}),
|
}),
|
||||||
stopping_parameters: Some(StoppingCriteriaParameters {
|
stopping_parameters: Some(StoppingCriteriaParameters {
|
||||||
max_new_tokens: max_total_tokens - truncate,
|
max_new_tokens: max_total_tokens - truncate,
|
||||||
|
@ -45,8 +45,8 @@ impl Health {
|
|||||||
repetition_penalty: 1.0,
|
repetition_penalty: 1.0,
|
||||||
frequency_penalty: 0.0,
|
frequency_penalty: 0.0,
|
||||||
watermark: false,
|
watermark: false,
|
||||||
grammar: Vec::new(),
|
grammar: String::new(),
|
||||||
fsm_grammar_state: Vec::new(),
|
fsm_grammar_state: 0,
|
||||||
}),
|
}),
|
||||||
stopping_parameters: Some(StoppingCriteriaParameters {
|
stopping_parameters: Some(StoppingCriteriaParameters {
|
||||||
max_new_tokens: 1,
|
max_new_tokens: 1,
|
||||||
|
@ -368,8 +368,8 @@ mod tests {
|
|||||||
repetition_penalty: 0.0,
|
repetition_penalty: 0.0,
|
||||||
frequency_penalty: 0.0,
|
frequency_penalty: 0.0,
|
||||||
watermark: false,
|
watermark: false,
|
||||||
grammar: Vec::new(),
|
grammar: String::new(),
|
||||||
fsm_grammar_state: Vec::new(),
|
fsm_grammar_state: 0,
|
||||||
},
|
},
|
||||||
stopping_parameters: StoppingCriteriaParameters {
|
stopping_parameters: StoppingCriteriaParameters {
|
||||||
ignore_eos_token: false,
|
ignore_eos_token: false,
|
||||||
|
@ -294,9 +294,9 @@ impl Validation {
|
|||||||
.await?;
|
.await?;
|
||||||
|
|
||||||
// initialize the grammar parameter
|
// initialize the grammar parameter
|
||||||
let grammar = vec![grammar];
|
let grammar = grammar;
|
||||||
// init the start state of the grammar
|
// init the start state of the grammar
|
||||||
let fsm_grammar_state = vec![0];
|
let fsm_grammar_state = 0;
|
||||||
|
|
||||||
let parameters = NextTokenChooserParameters {
|
let parameters = NextTokenChooserParameters {
|
||||||
temperature,
|
temperature,
|
||||||
|
Loading…
Reference in New Issue
Block a user