This was found on some machines: using hf_hub::api::sync::Api to download the config does not succeed, which makes warmup fail because attributes such as max_position_embeddings cannot be retrieved. Updating hf-hub to the latest version fixes this.

Signed-off-by: Wang, Yi A <yi.a.wang@intel.com>
This commit is contained in:
Wang, Yi A 2025-02-08 13:56:58 +00:00
parent 4b8cda684b
commit b7d86e8e53
3 changed files with 159 additions and 36 deletions

191
Cargo.lock generated
View File

@ -594,7 +594,7 @@ dependencies = [
"semver", "semver",
"serde", "serde",
"serde_json", "serde_json",
"thiserror", "thiserror 1.0.69",
] ]
[[package]] [[package]]
@ -1629,7 +1629,29 @@ dependencies = [
"reqwest 0.11.27", "reqwest 0.11.27",
"serde", "serde",
"serde_json", "serde_json",
"thiserror", "thiserror 1.0.69",
"tokio",
"ureq",
]
[[package]]
name = "hf-hub"
version = "0.4.1"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "112fa2f6ad4ab815b9e1b938b4b1e437032d055e2f92ed10fd6ab2e62d02c6b6"
dependencies = [
"dirs",
"futures",
"http 1.1.0",
"indicatif",
"log",
"native-tls",
"num_cpus",
"rand",
"reqwest 0.12.9",
"serde",
"serde_json",
"thiserror 2.0.11",
"tokio", "tokio",
"ureq", "ureq",
] ]
@ -1811,6 +1833,22 @@ dependencies = [
"tokio-native-tls", "tokio-native-tls",
] ]
[[package]]
name = "hyper-tls"
version = "0.6.0"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "70206fc6890eaca9fde8a0bf71caa2ddfc9fe045ac9e5c70df101a7dbde866e0"
dependencies = [
"bytes",
"http-body-util",
"hyper 1.5.1",
"hyper-util",
"native-tls",
"tokio",
"tokio-native-tls",
"tower-service",
]
[[package]] [[package]]
name = "hyper-util" name = "hyper-util"
version = "0.1.10" version = "0.1.10"
@ -2085,7 +2123,7 @@ checksum = "94bd26b1b737bc11f183620072e188d1c6ede67e0e78682228d66b49ec510e17"
dependencies = [ dependencies = [
"opentelemetry 0.20.0", "opentelemetry 0.20.0",
"opentelemetry-otlp", "opentelemetry-otlp",
"thiserror", "thiserror 1.0.69",
"tracing", "tracing",
"tracing-opentelemetry 0.21.0", "tracing-opentelemetry 0.21.0",
] ]
@ -2421,7 +2459,7 @@ dependencies = [
"metrics", "metrics",
"metrics-util", "metrics-util",
"quanta", "quanta",
"thiserror", "thiserror 1.0.69",
"tokio", "tokio",
"tracing", "tracing",
] ]
@ -2552,7 +2590,7 @@ dependencies = [
"futures", "futures",
"pin-project", "pin-project",
"rand", "rand",
"thiserror", "thiserror 1.0.69",
"tokio", "tokio",
"tokio-util", "tokio-util",
"tracing", "tracing",
@ -2601,10 +2639,10 @@ dependencies = [
"once_cell", "once_cell",
"parking_lot", "parking_lot",
"regex", "regex",
"rustls-pemfile", "rustls-pemfile 1.0.4",
"serde", "serde",
"serde_json", "serde_json",
"thiserror", "thiserror 1.0.69",
"tokio", "tokio",
"tokio-retry", "tokio-retry",
"tokio-util", "tokio-util",
@ -2908,7 +2946,7 @@ dependencies = [
"js-sys", "js-sys",
"once_cell", "once_cell",
"pin-project-lite", "pin-project-lite",
"thiserror", "thiserror 1.0.69",
"urlencoding", "urlencoding",
] ]
@ -2926,7 +2964,7 @@ dependencies = [
"opentelemetry_api", "opentelemetry_api",
"opentelemetry_sdk 0.20.0", "opentelemetry_sdk 0.20.0",
"prost 0.11.9", "prost 0.11.9",
"thiserror", "thiserror 1.0.69",
"tokio", "tokio",
"tonic 0.9.2", "tonic 0.9.2",
] ]
@ -2964,7 +3002,7 @@ dependencies = [
"js-sys", "js-sys",
"once_cell", "once_cell",
"pin-project-lite", "pin-project-lite",
"thiserror", "thiserror 1.0.69",
"urlencoding", "urlencoding",
] ]
@ -2986,7 +3024,7 @@ dependencies = [
"rand", "rand",
"regex", "regex",
"serde_json", "serde_json",
"thiserror", "thiserror 1.0.69",
"tokio", "tokio",
"tokio-stream", "tokio-stream",
] ]
@ -3008,7 +3046,7 @@ dependencies = [
"ordered-float 4.5.0", "ordered-float 4.5.0",
"percent-encoding", "percent-encoding",
"rand", "rand",
"thiserror", "thiserror 1.0.69",
] ]
[[package]] [[package]]
@ -3545,7 +3583,7 @@ dependencies = [
"rand_chacha", "rand_chacha",
"simd_helpers", "simd_helpers",
"system-deps", "system-deps",
"thiserror", "thiserror 1.0.69",
"v_frame", "v_frame",
"wasm-bindgen", "wasm-bindgen",
] ]
@ -3622,7 +3660,7 @@ checksum = "ba009ff324d1fc1b900bd1fdb31564febe58a8ccc8a6fdbb93b543d33b13ca43"
dependencies = [ dependencies = [
"getrandom", "getrandom",
"libredox", "libredox",
"thiserror", "thiserror 1.0.69",
] ]
[[package]] [[package]]
@ -3717,7 +3755,7 @@ dependencies = [
"http 0.2.12", "http 0.2.12",
"http-body 0.4.6", "http-body 0.4.6",
"hyper 0.14.31", "hyper 0.14.31",
"hyper-tls", "hyper-tls 0.5.0",
"ipnet", "ipnet",
"js-sys", "js-sys",
"log", "log",
@ -3726,12 +3764,12 @@ dependencies = [
"once_cell", "once_cell",
"percent-encoding", "percent-encoding",
"pin-project-lite", "pin-project-lite",
"rustls-pemfile", "rustls-pemfile 1.0.4",
"serde", "serde",
"serde_json", "serde_json",
"serde_urlencoded", "serde_urlencoded",
"sync_wrapper 0.1.2", "sync_wrapper 0.1.2",
"system-configuration", "system-configuration 0.5.1",
"tokio", "tokio",
"tokio-native-tls", "tokio-native-tls",
"tower-service", "tower-service",
@ -3750,30 +3788,40 @@ checksum = "a77c62af46e79de0a562e1a9849205ffcb7fc1238876e9bd743357570e04046f"
dependencies = [ dependencies = [
"base64 0.22.1", "base64 0.22.1",
"bytes", "bytes",
"encoding_rs",
"futures-channel", "futures-channel",
"futures-core", "futures-core",
"futures-util", "futures-util",
"h2 0.4.7",
"http 1.1.0", "http 1.1.0",
"http-body 1.0.1", "http-body 1.0.1",
"http-body-util", "http-body-util",
"hyper 1.5.1", "hyper 1.5.1",
"hyper-rustls",
"hyper-tls 0.6.0",
"hyper-util", "hyper-util",
"ipnet", "ipnet",
"js-sys", "js-sys",
"log", "log",
"mime", "mime",
"native-tls",
"once_cell", "once_cell",
"percent-encoding", "percent-encoding",
"pin-project-lite", "pin-project-lite",
"rustls-pemfile 2.2.0",
"serde", "serde",
"serde_json", "serde_json",
"serde_urlencoded", "serde_urlencoded",
"sync_wrapper 1.0.2", "sync_wrapper 1.0.2",
"system-configuration 0.6.1",
"tokio", "tokio",
"tokio-native-tls",
"tokio-util",
"tower-service", "tower-service",
"url", "url",
"wasm-bindgen", "wasm-bindgen",
"wasm-bindgen-futures", "wasm-bindgen-futures",
"wasm-streams",
"web-sys", "web-sys",
"windows-registry", "windows-registry",
] ]
@ -3944,6 +3992,15 @@ dependencies = [
"base64 0.21.7", "base64 0.21.7",
] ]
[[package]]
name = "rustls-pemfile"
version = "2.2.0"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "dce314e5fee3f39953d46bb63bb8a46d40c2f8fb7cc5a3b6cab2bde9721d6e50"
dependencies = [
"rustls-pki-types",
]
[[package]] [[package]]
name = "rustls-pki-types" name = "rustls-pki-types"
version = "1.10.0" version = "1.10.0"
@ -4254,6 +4311,17 @@ dependencies = [
"windows-sys 0.52.0", "windows-sys 0.52.0",
] ]
[[package]]
name = "socks"
version = "0.3.4"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "f0c3dbbd9ae980613c6dd8e28a9407b50509d3803b57624d5dfe8315218cd58b"
dependencies = [
"byteorder",
"libc",
"winapi",
]
[[package]] [[package]]
name = "spin" name = "spin"
version = "0.5.2" version = "0.5.2"
@ -4395,7 +4463,18 @@ checksum = "ba3a3adc5c275d719af8cb4272ea1c4a6d668a777f37e115f6d11ddbc1c8e0e7"
dependencies = [ dependencies = [
"bitflags 1.3.2", "bitflags 1.3.2",
"core-foundation 0.9.4", "core-foundation 0.9.4",
"system-configuration-sys", "system-configuration-sys 0.5.0",
]
[[package]]
name = "system-configuration"
version = "0.6.1"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "3c879d448e9d986b661742763247d3693ed13609438cf3d006f51f5368a5ba6b"
dependencies = [
"bitflags 2.6.0",
"core-foundation 0.9.4",
"system-configuration-sys 0.6.0",
] ]
[[package]] [[package]]
@ -4408,6 +4487,16 @@ dependencies = [
"libc", "libc",
] ]
[[package]]
name = "system-configuration-sys"
version = "0.6.0"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "8e1d1b10ced5ca923a1fcb8d03e96b8d3268065d724548c0211415ff6ac6bac4"
dependencies = [
"core-foundation-sys",
"libc",
]
[[package]] [[package]]
name = "system-deps" name = "system-deps"
version = "6.2.2" version = "6.2.2"
@ -4483,11 +4572,11 @@ dependencies = [
"cxx", "cxx",
"cxx-build", "cxx-build",
"hashbrown 0.15.1", "hashbrown 0.15.1",
"hf-hub", "hf-hub 0.3.2",
"pkg-config", "pkg-config",
"pyo3", "pyo3",
"text-generation-router", "text-generation-router",
"thiserror", "thiserror 1.0.69",
"tokenizers", "tokenizers",
"tokio", "tokio",
"tokio-stream", "tokio-stream",
@ -4501,13 +4590,13 @@ dependencies = [
"average", "average",
"clap 4.5.21", "clap 4.5.21",
"float-ord", "float-ord",
"hf-hub", "hf-hub 0.3.2",
"ratatui", "ratatui",
"serde", "serde",
"serde_json", "serde_json",
"tabled", "tabled",
"text-generation-client", "text-generation-client",
"thiserror", "thiserror 1.0.69",
"tokenizers", "tokenizers",
"tokio", "tokio",
"tracing", "tracing",
@ -4524,7 +4613,7 @@ dependencies = [
"grpc-metadata", "grpc-metadata",
"prost 0.12.6", "prost 0.12.6",
"prost-build", "prost-build",
"thiserror", "thiserror 1.0.69",
"tokio", "tokio",
"tonic 0.10.2", "tonic 0.10.2",
"tonic-build", "tonic-build",
@ -4539,7 +4628,7 @@ dependencies = [
"clap 4.5.21", "clap 4.5.21",
"ctrlc", "ctrlc",
"float_eq", "float_eq",
"hf-hub", "hf-hub 0.4.1",
"nix 0.28.0", "nix 0.28.0",
"once_cell", "once_cell",
"pyo3", "pyo3",
@ -4547,7 +4636,7 @@ dependencies = [
"reqwest 0.11.27", "reqwest 0.11.27",
"serde", "serde",
"serde_json", "serde_json",
"thiserror", "thiserror 1.0.69",
"tracing", "tracing",
"tracing-subscriber", "tracing-subscriber",
"vergen", "vergen",
@ -4568,7 +4657,7 @@ dependencies = [
"csv", "csv",
"futures", "futures",
"futures-util", "futures-util",
"hf-hub", "hf-hub 0.3.2",
"image", "image",
"init-tracing-opentelemetry", "init-tracing-opentelemetry",
"itertools 0.10.5", "itertools 0.10.5",
@ -4590,7 +4679,7 @@ dependencies = [
"serde", "serde",
"serde_json", "serde_json",
"sysinfo", "sysinfo",
"thiserror", "thiserror 1.0.69",
"tokenizers", "tokenizers",
"tokio", "tokio",
"tokio-stream", "tokio-stream",
@ -4618,7 +4707,7 @@ dependencies = [
"futures", "futures",
"futures-util", "futures-util",
"grpc-metadata", "grpc-metadata",
"hf-hub", "hf-hub 0.3.2",
"image", "image",
"init-tracing-opentelemetry", "init-tracing-opentelemetry",
"jsonschema", "jsonschema",
@ -4639,7 +4728,7 @@ dependencies = [
"serde_json", "serde_json",
"slotmap", "slotmap",
"text-generation-router", "text-generation-router",
"thiserror", "thiserror 1.0.69",
"tokenizers", "tokenizers",
"tokio", "tokio",
"tokio-stream", "tokio-stream",
@ -4668,7 +4757,7 @@ dependencies = [
"futures", "futures",
"futures-util", "futures-util",
"grpc-metadata", "grpc-metadata",
"hf-hub", "hf-hub 0.3.2",
"image", "image",
"init-tracing-opentelemetry", "init-tracing-opentelemetry",
"itertools 0.13.0", "itertools 0.13.0",
@ -4690,7 +4779,7 @@ dependencies = [
"serde_json", "serde_json",
"slotmap", "slotmap",
"text-generation-router", "text-generation-router",
"thiserror", "thiserror 1.0.69",
"tokenizers", "tokenizers",
"tokio", "tokio",
"tokio-stream", "tokio-stream",
@ -4720,7 +4809,16 @@ version = "1.0.69"
source = "registry+https://github.com/rust-lang/crates.io-index" source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "b6aaf5339b578ea85b50e080feb250a3e8ae8cfcdff9a461c9ec2904bc923f52" checksum = "b6aaf5339b578ea85b50e080feb250a3e8ae8cfcdff9a461c9ec2904bc923f52"
dependencies = [ dependencies = [
"thiserror-impl", "thiserror-impl 1.0.69",
]
[[package]]
name = "thiserror"
version = "2.0.11"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "d452f284b73e6d76dd36758a0c8684b1d5be31f92b89d07fd5822175732206fc"
dependencies = [
"thiserror-impl 2.0.11",
] ]
[[package]] [[package]]
@ -4734,6 +4832,17 @@ dependencies = [
"syn 2.0.89", "syn 2.0.89",
] ]
[[package]]
name = "thiserror-impl"
version = "2.0.11"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "26afc1baea8a989337eeb52b6e72a039780ce45c3edfcc9c5b9d112feeb173c2"
dependencies = [
"proc-macro2",
"quote",
"syn 2.0.89",
]
[[package]] [[package]]
name = "thread_local" name = "thread_local"
version = "1.1.8" version = "1.1.8"
@ -4818,7 +4927,7 @@ dependencies = [
"derive_builder", "derive_builder",
"esaxx-rs", "esaxx-rs",
"getrandom", "getrandom",
"hf-hub", "hf-hub 0.3.2",
"indicatif", "indicatif",
"itertools 0.12.1", "itertools 0.12.1",
"lazy_static", "lazy_static",
@ -4835,7 +4944,7 @@ dependencies = [
"serde", "serde",
"serde_json", "serde_json",
"spm_precompiled", "spm_precompiled",
"thiserror", "thiserror 1.0.69",
"unicode-normalization-alignments", "unicode-normalization-alignments",
"unicode-segmentation", "unicode-segmentation",
"unicode_categories", "unicode_categories",
@ -5337,6 +5446,7 @@ dependencies = [
"rustls-webpki", "rustls-webpki",
"serde", "serde",
"serde_json", "serde_json",
"socks",
"url", "url",
"webpki-roots", "webpki-roots",
] ]
@ -5599,6 +5709,19 @@ version = "0.2.95"
source = "registry+https://github.com/rust-lang/crates.io-index" source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "65fc09f10666a9f147042251e0dda9c18f166ff7de300607007e96bdebc1068d" checksum = "65fc09f10666a9f147042251e0dda9c18f166ff7de300607007e96bdebc1068d"
[[package]]
name = "wasm-streams"
version = "0.4.2"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "15053d8d85c7eccdbefef60f06769760a563c7f0a9d6902a13d35c7800b0ad65"
dependencies = [
"futures-util",
"js-sys",
"wasm-bindgen",
"wasm-bindgen-futures",
"web-sys",
]
[[package]] [[package]]
name = "web-sys" name = "web-sys"
version = "0.3.72" version = "0.3.72"

View File

@ -162,7 +162,7 @@ ARG MAMBA_VERSION=23.1.0-1
ARG PYTHON_VERSION='3.11.10' ARG PYTHON_VERSION='3.11.10'
# Automatically set by buildx # Automatically set by buildx
ARG TARGETPLATFORM ARG TARGETPLATFORM
ENV PATH /opt/conda/bin:$PATH ENV PATH=/opt/conda/bin:$PATH
# TGI seem to require libssl.so.1.1 instead of libssl.so.3 so we can't use ubuntu 22.04. Ubuntu 20.04 has python==3.8, and TGI requires python>=3.9, hence the need for miniconda. # TGI seem to require libssl.so.1.1 instead of libssl.so.3 so we can't use ubuntu 22.04. Ubuntu 20.04 has python==3.8, and TGI requires python>=3.9, hence the need for miniconda.
# Install mamba # Install mamba

View File

@ -9,7 +9,7 @@ homepage.workspace = true
[dependencies] [dependencies]
clap = { version = "4.4.5", features = ["derive", "env"] } clap = { version = "4.4.5", features = ["derive", "env"] }
ctrlc = { version = "3.4.1", features = ["termination"] } ctrlc = { version = "3.4.1", features = ["termination"] }
hf-hub = "0.3.2" hf-hub = "0.4.1"
nix = { version = "0.28.0", features = ["signal"] } nix = { version = "0.28.0", features = ["signal"] }
once_cell = "1.19.0" once_cell = "1.19.0"
pyo3 = { workspace = true } pyo3 = { workspace = true }