# Mirror of https://github.com/huggingface/text-generation-inference.git
# Synced 2025-04-24 16:32:12 +00:00
#
# * Fixing odd tokenization self modifications on the Rust side (load and resave in Python).
# * Fixing the builds ?
# * Fix the gh action?
# * Fixing the location ?
# * Validation is odd.
# * Try a faster runner
# * Upgrade python version.
# * Remove sccache
# * No sccache.
# * Getting libpython maybe ?
# * List stuff.
# * Monkey it up.
# * have no idea at this point
# * Tmp.
# * Shot in the dark.
# * Tmate the hell out of this.
# * Desperation.
# * WTF.
# * -y.
# * Apparently 3.10 is not available anymore.
# * Updating the dockerfile to make libpython discoverable at runtime too.
# * Put back rust tests.
# * Why do we want mkl on AMD ?
# * Forcing 3.11 ?
#
# File: 51 lines, 1.1 KiB, TOML
# Cargo workspace root: every crate listed in `members` is part of the
# workspace.
[workspace]
members = [
    "benchmark",
    "backends/v3",
    "backends/grpc-metadata",
    "backends/trtllm",
    "backends/client",
    "launcher",
]
# Crates selected when a cargo command is run at the workspace root without
# `-p` / `--workspace`.
# NOTE(review): "backends/trtllm" is a member but is deliberately left out of
# the default set; the reason is not recorded here, so confirm before
# re-enabling it.
default-members = [
    "benchmark",
    "backends/v3",
    "backends/grpc-metadata",
    # "backends/trtllm",
    "backends/client",
    "launcher",
]
resolver = "2"

# Package metadata defined once for the whole workspace. A member crate
# inherits a field by declaring `<field>.workspace = true` in its own manifest.
[workspace.package]
version = "2.2.1-dev0"
edition = "2021"
authors = ["Olivier Dehaene"]
homepage = "https://github.com/huggingface/text-generation-inference"

# Dependency versions pinned once for the workspace. A member crate pulls one
# in with `<name> = { workspace = true }`. Entries are kept in alphabetical
# order.
[workspace.dependencies]
base64 = "0.22.0"
hf-hub = { version = "0.3.1", features = ["tokio"] }
metrics = { version = "0.23.0" }
metrics-exporter-prometheus = { version = "0.15.1", features = [] }
minijinja = { version = "2.2.0", features = ["json"] }
minijinja-contrib = { version = "2.0.2", features = ["pycompat"] }
tokenizers = { version = "0.20.0", features = ["http"] }

# Base release profile. Cargo's built-in release default is
# `incremental = false`; it is switched on here, and every profile that
# inherits from `release` picks it up unless it overrides the key.
[profile.release]
incremental = true

# Custom profile layered on `release`, selected with
# `cargo build --profile release-binary`.
[profile.release-binary]
inherits = "release"
# Limited debug info (no type- or variable-level detail).
debug = 1
# Same value as the inherited `release` setting; restated explicitly.
incremental = true
# Abort on panic instead of unwinding.
panic = "abort"

# Custom profile layered on `release`, selected with
# `cargo build --profile release-opt`.
[profile.release-opt]
inherits = "release"
# No debug info.
debug = 0
# Overrides the `incremental = true` inherited from `release`.
incremental = false
# Whole-program link-time optimization across all crates in the graph.
lto = "fat"
opt-level = 3
# A single codegen unit per crate.
codegen-units = 1