backend(vllm): disable metrics for now

This commit is contained in:
Morgan Funtowicz 2025-01-31 10:56:54 +01:00
parent 003163a2b9
commit 5452c1294c
2 changed files with 7 additions and 1 deletions

View File

@ -63,6 +63,12 @@ impl TryFrom<&RequestOutput> for InferStreamResponse {
.unwrap(),
seed: None,
},
// start: STARTUP_INSTANT
// .checked_sub(Duration::from_secs_f32(metrics.first_scheduled_time))
// .unwrap_or_else(Instant::now),
// queued: STARTUP_INSTANT
// .checked_sub(Duration::from_secs_f32(metrics.arrival_time))
// .unwrap_or_else(Instant::now),
start: Instant::now(),
queued: Instant::now(),
})

View File

@ -11,7 +11,7 @@ use pyo3::types::PyModule;
use pyo3::{Py, PyAny, PyErr, PyObject, Python};
use tokio::time::Instant;
pub(crate) const STARTUP_INSTANT: Instant = Instant::now();
pub(crate) static STARTUP_INSTANT: Instant = Instant::now();
static PY_TOKENS_PROMPT_CLASS: GILOnceCell<Py<PyAny>> = GILOnceCell::new();
static PY_SAMPLING_PARAMS_CLASS: GILOnceCell<Py<PyAny>> = GILOnceCell::new();