backend(vllm): disable metrics for now

2025-09-09 19:34:53 +00:00 · 2025-01-31 10:56:54 +01:00 · 2025-01-31 10:56:54 +01:00 · 5452c1294c
commit 5452c1294c
parent 003163a2b9
2 changed files with 7 additions and 1 deletion
--- a/backends/vllm/src/backend.rs
+++ b/backends/vllm/src/backend.rs
@@ -63,6 +63,12 @@ impl TryFrom<&RequestOutput> for InferStreamResponse {
                                .unwrap(),
                            seed: None,
                        },
                        // start: STARTUP_INSTANT
                        //     .checked_sub(Duration::from_secs_f32(metrics.first_scheduled_time))
                        //     .unwrap_or_else(Instant::now),
                        // queued: STARTUP_INSTANT
                        //     .checked_sub(Duration::from_secs_f32(metrics.arrival_time))
                        //     .unwrap_or_else(Instant::now),
                        start: Instant::now(),
                        queued: Instant::now(),
                    })
--- a/backends/vllm/src/lib.rs
+++ b/backends/vllm/src/lib.rs
@@ -11,7 +11,7 @@ use pyo3::types::PyModule;
 use pyo3::{Py, PyAny, PyErr, PyObject, Python};
 use tokio::time::Instant;
-pub(crate) const STARTUP_INSTANT: Instant = Instant::now();
+pub(crate) static STARTUP_INSTANT: Instant = Instant::now();
 static PY_TOKENS_PROMPT_CLASS: GILOnceCell<Py<PyAny>> = GILOnceCell::new();
 static PY_SAMPLING_PARAMS_CLASS: GILOnceCell<Py<PyAny>> = GILOnceCell::new();