mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-19 22:02:06 +00:00
feat: concat the adapter id to the model id in chat response (#2779)
* feat: concat the adapter id to the model id in chat response
* fix: updated to include only the adapter id in chat response
This commit is contained in:
parent
780531ec77
commit
c637d68d74
@ -1228,6 +1228,7 @@ pub(crate) async fn chat_completions(
|
|||||||
let span = tracing::Span::current();
|
let span = tracing::Span::current();
|
||||||
metrics::counter!("tgi_request_count").increment(1);
|
metrics::counter!("tgi_request_count").increment(1);
|
||||||
let ChatRequest {
|
let ChatRequest {
|
||||||
|
model,
|
||||||
stream,
|
stream,
|
||||||
stream_options,
|
stream_options,
|
||||||
logprobs,
|
logprobs,
|
||||||
@ -1238,8 +1239,11 @@ pub(crate) async fn chat_completions(
|
|||||||
|
|
||||||
let logprobs = logprobs.unwrap_or_default();
|
let logprobs = logprobs.unwrap_or_default();
|
||||||
|
|
||||||
// static values that will be returned in all cases
|
// extract model id from request if specified
|
||||||
let model_id = info.model_id.clone();
|
let model_id = match model.as_deref() {
|
||||||
|
Some("tgi") | None => info.model_id.clone(),
|
||||||
|
Some(m_id) => m_id.to_string(),
|
||||||
|
};
|
||||||
let system_fingerprint = format!("{}-{}", info.version, info.docker_label.unwrap_or("native"));
|
let system_fingerprint = format!("{}-{}", info.version, info.docker_label.unwrap_or("native"));
|
||||||
// switch on stream
|
// switch on stream
|
||||||
if stream {
|
if stream {
|
||||||
|
Loading…
Reference in New Issue
Block a user