From bdd9596b6cfeed5ef61629d6d5904d24a08b13cc Mon Sep 17 00:00:00 2001
From: Nicolas Patry
Date: Mon, 4 Dec 2023 13:50:59 +0000
Subject: [PATCH] Propagate speculate

---
 launcher/src/main.rs | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/launcher/src/main.rs b/launcher/src/main.rs
index b923fcea..3545c005 100644
--- a/launcher/src/main.rs
+++ b/launcher/src/main.rs
@@ -383,6 +383,7 @@ fn shard_manager(
     model_id: String,
     revision: Option,
     quantize: Option,
+    speculate: Option,
     dtype: Option,
     trust_remote_code: bool,
     uds_path: String,
@@ -895,6 +896,7 @@ fn spawn_shards(
         let shutdown_sender = shutdown_sender.clone();
         let otlp_endpoint = args.otlp_endpoint.clone();
         let quantize = args.quantize;
+        let speculate = args.speculate;
         let dtype = args.dtype;
         let trust_remote_code = args.trust_remote_code;
         let master_port = args.master_port;
@@ -909,6 +911,7 @@ fn spawn_shards(
                 model_id,
                 revision,
                 quantize,
+                speculate,
                 dtype,
                 trust_remote_code,
                 uds_path,