mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-23 07:52:06 +00:00
Co-authored-by: mswiniarsk <156412439+mswiniarsk@users.noreply.github.com>
This commit is contained in:
parent
80ae9ead28
commit
8e14780bf4
@@ -463,7 +463,7 @@ fn shard_manager(
|
|||||||
envs.push(("MAX_TOTAL_TOKENS".into(), max_total_tokens.to_string().into()));
|
envs.push(("MAX_TOTAL_TOKENS".into(), max_total_tokens.to_string().into()));
|
||||||
|
|
||||||
// Torch Distributed Env vars
|
// Torch Distributed Env vars
|
||||||
if world_size == 1 {
|
if world_size == 1 {
|
||||||
envs.push(("RANK".into(), rank.to_string().into()));
|
envs.push(("RANK".into(), rank.to_string().into()));
|
||||||
}
|
}
|
||||||
envs.push(("WORLD_SIZE".into(), world_size.to_string().into()));
|
envs.push(("WORLD_SIZE".into(), world_size.to_string().into()));
|
||||||
@@ -603,6 +603,7 @@ fn shard_manager(
|
|||||||
// Shard is ready
|
// Shard is ready
|
||||||
if uds.exists() && !ready {
|
if uds.exists() && !ready {
|
||||||
tracing::info!("Shard ready in {:?}", start_time.elapsed());
|
tracing::info!("Shard ready in {:?}", start_time.elapsed());
|
||||||
|
sleep(Duration::from_millis(2000));
|
||||||
status_sender.send(ShardStatus::Ready).unwrap();
|
status_sender.send(ShardStatus::Ready).unwrap();
|
||||||
ready = true;
|
ready = true;
|
||||||
} else if !ready && wait_time.elapsed() > Duration::from_secs(10) {
|
} else if !ready && wait_time.elapsed() > Duration::from_secs(10) {
|
||||||
|
@@ -142,7 +142,9 @@ fn main() -> Result<(), RouterError> {
|
|||||||
// This will only be used to validate payloads
|
// This will only be used to validate payloads
|
||||||
let local_path = Path::new(&tokenizer_name);
|
let local_path = Path::new(&tokenizer_name);
|
||||||
let local_model = local_path.exists() && local_path.is_dir();
|
let local_model = local_path.exists() && local_path.is_dir();
|
||||||
let skip_tokenizer_in_tgi = env::var("SKIP_TOKENIZER_IN_TGI").ok().map_or(false, |value| value.to_lowercase() == "true");
|
let skip_tokenizer_in_tgi = env::var("SKIP_TOKENIZER_IN_TGI")
|
||||||
|
.ok()
|
||||||
|
.map_or(false, |value| value.to_lowercase() == "true");
|
||||||
let tokenizer = if skip_tokenizer_in_tgi {
|
let tokenizer = if skip_tokenizer_in_tgi {
|
||||||
None
|
None
|
||||||
} else if local_model {
|
} else if local_model {
|
||||||
|
Loading…
Reference in New Issue
Block a user