mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-10 11:54:52 +00:00
Adding additional response header X-Total-Tokens
This commit is contained in:
parent
b4024edd45
commit
1e62237d44
@ -55,6 +55,7 @@ export default function () {
|
||||
|
||||
if (res.status === 200) {
|
||||
totalTime.add(res.headers["X-Total-Time"]);
|
||||
totalTokens.add(res.headers["X-Total-Tokens"]);
|
||||
validationTime.add(res.headers["X-Validation-Time"]);
|
||||
queueTime.add(res.headers["X-Queue-Time"]);
|
||||
inferenceTime.add(res.headers["X-Inference-Time"]);
|
||||
|
@ -241,6 +241,10 @@ async fn generate(
|
||||
"x-total-time",
|
||||
total_time.as_millis().to_string().parse().unwrap(),
|
||||
);
|
||||
headers.insert(
|
||||
"x-total-tokens",
|
||||
response.generated_text.generated_tokens.to_string().parse().unwrap(),
|
||||
);
|
||||
headers.insert(
|
||||
"x-validation-time",
|
||||
validation_time.as_millis().to_string().parse().unwrap(),
|
||||
|
Loading…
Reference in New Issue
Block a user