mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-12 04:44:52 +00:00
adding max_token_capacity_metric
This commit is contained in:
parent
d1f257ac56
commit
3e76ba6599
@ -1993,6 +1993,8 @@ async fn start(
|
|||||||
"Batch size of the next batch"
|
"Batch size of the next batch"
|
||||||
);
|
);
|
||||||
|
|
||||||
|
metrics::counter!("max_token_capacity").increment(u64::from(max_batch_total_tokens));
|
||||||
|
|
||||||
// CORS layer
|
// CORS layer
|
||||||
let allow_origin = allow_origin.unwrap_or(AllowOrigin::any());
|
let allow_origin = allow_origin.unwrap_or(AllowOrigin::any());
|
||||||
let cors_layer = CorsLayer::new()
|
let cors_layer = CorsLayer::new()
|
||||||
|
Loading…
Reference in New Issue
Block a user