diff --git a/backends/trtllm/Cargo.toml b/backends/trtllm/Cargo.toml index 5d907109..b6c39346 100644 --- a/backends/trtllm/Cargo.toml +++ b/backends/trtllm/Cargo.toml @@ -7,20 +7,16 @@ homepage.workspace = true [dependencies] async-trait = "0.1" -#async-stream = "0.3" clap = { version = "4.5", features = ["derive"] } cxx = "1.0" -hashbrown = "0.14" +hashbrown = "0.15" hf-hub = { workspace = true } -#log = { version = "0.4", features = [] } text-generation-router = { path = "../../router" } tokenizers = { workspace = true } -tokio = { version = "1.39", features = ["rt", "rt-multi-thread", "parking_lot", "signal", "sync"] } -tokio-stream = "0.1.15" +tokio = { version = "1.43.0", features = ["rt", "rt-multi-thread", "parking_lot", "signal", "sync"] } +tokio-stream = "0.1.17" thiserror = "1.0.63" tracing = "0.1" -#tracing-opentelemetry = "0.25" -#tracing-subscriber = { version = "0.3", features = ["json", "env-filter"] } pyo3 = { workspace = true } [build-dependencies] diff --git a/backends/trtllm/src/looper.rs b/backends/trtllm/src/looper.rs index 43f23242..b148ec30 100644 --- a/backends/trtllm/src/looper.rs +++ b/backends/trtllm/src/looper.rs @@ -10,7 +10,7 @@ use tokio::sync::TryAcquireError; use tokio::task::spawn_blocking; use tokio::time::Instant; use tokio_stream::wrappers::UnboundedReceiverStream; -use tracing::{debug, error, info, warn}; +use tracing::{debug, error, warn}; use text_generation_router::infer::InferError::{GenerationError, ValidationError}; use text_generation_router::infer::{Backend, GeneratedText, InferError, InferStreamResponse};