mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-10 20:04:52 +00:00
Propagate speculate
This commit is contained in:
parent
7ed07bcc05
commit
bdd9596b6c
@@ -383,6 +383,7 @@ fn shard_manager(
|
||||
model_id: String,
|
||||
revision: Option<String>,
|
||||
quantize: Option<Quantization>,
|
||||
speculate: Option<usize>,
|
||||
dtype: Option<Dtype>,
|
||||
trust_remote_code: bool,
|
||||
uds_path: String,
|
||||
@@ -895,6 +896,7 @@ fn spawn_shards(
|
||||
let shutdown_sender = shutdown_sender.clone();
|
||||
let otlp_endpoint = args.otlp_endpoint.clone();
|
||||
let quantize = args.quantize;
|
||||
let speculate = args.speculate;
|
||||
let dtype = args.dtype;
|
||||
let trust_remote_code = args.trust_remote_code;
|
||||
let master_port = args.master_port;
|
||||
@@ -909,6 +911,7 @@ fn spawn_shards(
|
||||
model_id,
|
||||
revision,
|
||||
quantize,
|
||||
speculate,
|
||||
dtype,
|
||||
trust_remote_code,
|
||||
uds_path,
|
||||
|
Loading…
Reference in New Issue
Block a user