Add X-Total-Tokens response header

This commit is contained in:
Julian Bright 2023-07-11 03:17:09 +10:00
parent b4024edd45
commit 1e62237d44
2 changed files with 5 additions and 0 deletions

View File

@@ -55,6 +55,7 @@ export default function () {
if (res.status === 200) {
totalTime.add(res.headers["X-Total-Time"]);
totalTokens.add(res.headers["X-Total-Tokens"]);
validationTime.add(res.headers["X-Validation-Time"]);
queueTime.add(res.headers["X-Queue-Time"]);
inferenceTime.add(res.headers["X-Inference-Time"]);

View File

@@ -241,6 +241,10 @@ async fn generate(
"x-total-time",
total_time.as_millis().to_string().parse().unwrap(),
);
headers.insert(
"x-total-tokens",
response.generated_text.generated_tokens.to_string().parse().unwrap(),
);
headers.insert(
"x-validation-time",
validation_time.as_millis().to_string().parse().unwrap(),