mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 20:34:54 +00:00
Add `max_token_capacity` metric
This commit is contained in:
parent
d1f257ac56
commit
3e76ba6599
@@ -1993,6 +1993,8 @@ async fn start(
|
||||
"Batch size of the next batch"
|
||||
);
|
||||
|
||||
metrics::counter!("max_token_capacity").increment(u64::from(max_batch_total_tokens));
|
||||
|
||||
// CORS layer
|
||||
let allow_origin = allow_origin.unwrap_or(AllowOrigin::any());
|
||||
let cors_layer = CorsLayer::new()
|
||||
|
Loading…
Reference in New Issue
Block a user