diff --git a/launcher/src/main.rs b/launcher/src/main.rs index f015a393..7159ecf2 100644 --- a/launcher/src/main.rs +++ b/launcher/src/main.rs @@ -21,13 +21,13 @@ use subprocess::{ExitStatus, Popen, PopenConfig, PopenError, Redirection}; struct Args { #[clap(default_value = "bigscience/bloom-560m", long, env = "HF_MODEL_ID")] model_id: String, - #[clap(long, env)] + #[clap(long, env = "HF_MODEL_REVISION")] revision: Option, #[clap(long, env)] sharded: Option, #[clap(long, env = "SM_NUM_GPUS")] num_shard: Option, - #[clap(long, env)] + #[clap(long, env = "HF_MODEL_QUANTIZE")] quantize: bool, #[clap(default_value = "128", long, env)] max_concurrent_requests: usize,