mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-09 11:24:53 +00:00
enable hf-transfer even with num-shard==1
This commit is contained in:
parent
3bf5c2dd65
commit
c510c30a17
@ -471,6 +471,9 @@ fn shard_manager(
|
|||||||
// Safetensors load fast
|
// Safetensors load fast
|
||||||
env.push(("SAFETENSORS_FAST_GPU".into(), "1".into()));
|
env.push(("SAFETENSORS_FAST_GPU".into(), "1".into()));
|
||||||
|
|
||||||
|
// Enable hf transfer for insane download speeds
|
||||||
|
env.push(("HF_HUB_ENABLE_HF_TRANSFER".into(), "1".into()));
|
||||||
|
|
||||||
// If huggingface_hub_cache is some, pass it to the shard
|
// If huggingface_hub_cache is some, pass it to the shard
|
||||||
// Useful when running inside a docker container
|
// Useful when running inside a docker container
|
||||||
if let Some(huggingface_hub_cache) = huggingface_hub_cache {
|
if let Some(huggingface_hub_cache) = huggingface_hub_cache {
|
||||||
|
Loading…
Reference in New Issue
Block a user