From 4fe79da8f3aa98b5fce2598882944828af45f59a Mon Sep 17 00:00:00 2001 From: OlivierDehaene <23298448+OlivierDehaene@users.noreply.github.com> Date: Wed, 21 Feb 2024 15:28:46 +0100 Subject: [PATCH] fix: fix openapi schema --- router/src/lib.rs | 2 +- router/src/server.rs | 12 +++++++++--- 2 files changed, 10 insertions(+), 4 deletions(-) diff --git a/router/src/lib.rs b/router/src/lib.rs index c6928a5a..113e2642 100644 --- a/router/src/lib.rs +++ b/router/src/lib.rs @@ -347,7 +347,7 @@ pub(crate) struct ChatCompletionTopLogprob { logprob: f32, } -#[derive(Clone, Deserialize, Serialize)] +#[derive(Clone, Deserialize, Serialize, ToSchema)] pub(crate) struct Usage { pub prompt_tokens: u32, pub completion_tokens: u32, diff --git a/router/src/server.rs b/router/src/server.rs index ebde7133..9fdd66cc 100644 --- a/router/src/server.rs +++ b/router/src/server.rs @@ -3,11 +3,12 @@ use crate::health::Health; use crate::infer::{InferError, InferResponse, InferStreamResponse}; use crate::validation::ValidationError; use crate::{ - BestOfSequence, ChatCompletion, ChatCompletionChoice, ChatCompletionChunk, ChatCompletionDelta, - ChatCompletionLogprobs, ChatRequest, CompatGenerateRequest, Details, ErrorResponse, + BestOfSequence, ChatCompletion, ChatCompletionChoice, ChatCompletionChunk, + ChatCompletionComplete, ChatCompletionDelta, ChatCompletionLogprob, ChatCompletionLogprobs, + ChatCompletionTopLogprob, ChatRequest, CompatGenerateRequest, Details, ErrorResponse, FinishReason, GenerateParameters, GenerateRequest, GenerateResponse, GrammarType, HubModelInfo, HubTokenizerConfig, Infer, Info, Message, PrefillToken, SimpleToken, StreamDetails, - StreamResponse, Token, TokenizeResponse, Validation, VertexRequest, VertexResponse, + StreamResponse, Token, TokenizeResponse, Usage, Validation, VertexRequest, VertexResponse, }; use axum::extract::Extension; use axum::http::{HeaderMap, Method, StatusCode}; @@ -896,9 +897,13 @@ pub async fn run( GrammarType, ChatRequest, Message, + ChatCompletionComplete, ChatCompletionChoice, ChatCompletionDelta, ChatCompletionChunk, + ChatCompletionLogprob, + ChatCompletionLogprobs, + ChatCompletionTopLogprob, ChatCompletion, GenerateParameters, PrefillToken, @@ -913,6 +918,7 @@ pub async fn run( StreamDetails, ErrorResponse, GrammarType, + Usage, ) ), tags(