diff --git a/backends/trtllm/src/backend.rs b/backends/trtllm/src/backend.rs index 4696a964..4b92fe01 100644 --- a/backends/trtllm/src/backend.rs +++ b/backends/trtllm/src/backend.rs @@ -103,13 +103,13 @@ impl TensorRtLlmBackend { pub fn new + Send + 'static, PP: AsRef + Send + 'static>( tokenizer: Tokenizer, engine_folder: P, - _executor_worker_path: Option, + executor_worker_path: PP, ) -> Result { Ok(TensorRtLlmBackend { tokenizer: Arc::new(tokenizer), backend: Arc::new(RwLock::new(create_tensorrt_llm_backend( engine_folder.as_ref().to_str().unwrap(), - "", + executor_worker_path.as_ref().to_str().unwrap(), ))), }) } diff --git a/backends/trtllm/src/main.rs b/backends/trtllm/src/main.rs index 5d989feb..013b4ad9 100644 --- a/backends/trtllm/src/main.rs +++ b/backends/trtllm/src/main.rs @@ -56,12 +56,8 @@ struct Args { max_client_batch_size: usize, #[clap(long, env)] auth_token: Option, - #[clap( - long, - env, - help = "Path to the TensorRT-LLM Orchestrator Worker binary" - )] - executor_worker: Option, + #[clap(long, env, help = "Path to the TensorRT-LLM Orchestrator worker")] + executor_worker: PathBuf, } #[tokio::main] @@ -123,13 +119,11 @@ async fn main() -> Result<(), TensorRtLlmBackendError> { } } - if let Some(ref executor_worker) = executor_worker { - if !executor_worker.exists() { - return Err(TensorRtLlmBackendError::ArgumentValidation(format!( - "`executor_work` specified path doesn't exists: {}", - executor_worker.display() - ))); - } + if !executor_worker.exists() { + return Err(TensorRtLlmBackendError::ArgumentValidation(format!( + "`executor_work` specified path doesn't exists: {}", + executor_worker.display() + ))); } // Run server