This commit is contained in:
Nicolas Patry 2025-04-18 13:07:18 +02:00 committed by GitHub
parent 95ccba3705
commit 8f8819795f
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -67,16 +67,26 @@ pub(crate) async fn sagemaker_compatibility(
default_return_full_text: Extension<bool>, default_return_full_text: Extension<bool>,
infer: Extension<Infer>, infer: Extension<Infer>,
compute_type: Extension<ComputeType>, compute_type: Extension<ComputeType>,
context: Extension<Option<opentelemetry::Context>>,
info: Extension<Info>, info: Extension<Info>,
Json(req): Json<SagemakerRequest>, Json(req): Json<SagemakerRequest>,
) -> Result<Response, (StatusCode, Json<ErrorResponse>)> { ) -> Result<Response, (StatusCode, Json<ErrorResponse>)> {
match req { match req {
SagemakerRequest::Generate(req) => { SagemakerRequest::Generate(req) => {
compat_generate(default_return_full_text, infer, compute_type, Json(req)).await compat_generate(
default_return_full_text,
infer,
compute_type,
context,
Json(req),
)
.await
}
SagemakerRequest::Chat(req) => {
chat_completions(infer, compute_type, info, context, Json(req)).await
} }
SagemakerRequest::Chat(req) => chat_completions(infer, compute_type, info, Json(req)).await,
SagemakerRequest::Completion(req) => { SagemakerRequest::Completion(req) => {
completions(infer, compute_type, info, Json(req)).await completions(infer, compute_type, info, context, Json(req)).await
} }
} }
} }