mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-12 12:54:52 +00:00
fix: remove dev debug trait and unneeded mut
This commit is contained in:
parent
515cd66705
commit
e57b6cccda
@@ -1211,7 +1211,7 @@ pub(crate) struct ChatTokenizeResponse {
|
|||||||
#[serde(transparent)]
|
#[serde(transparent)]
|
||||||
pub(crate) struct TokenizeResponse(Vec<SimpleToken>);
|
pub(crate) struct TokenizeResponse(Vec<SimpleToken>);
|
||||||
|
|
||||||
#[derive(Serialize, ToSchema, Debug)]
|
#[derive(Serialize, ToSchema)]
|
||||||
pub(crate) struct StreamDetails {
|
pub(crate) struct StreamDetails {
|
||||||
#[schema(example = "length")]
|
#[schema(example = "length")]
|
||||||
pub finish_reason: FinishReason,
|
pub finish_reason: FinishReason,
|
||||||
@@ -1223,7 +1223,7 @@ pub(crate) struct StreamDetails {
|
|||||||
pub input_length: u32,
|
pub input_length: u32,
|
||||||
}
|
}
|
||||||
|
|
||||||
#[derive(Serialize, ToSchema, Debug)]
|
#[derive(Serialize, ToSchema)]
|
||||||
pub(crate) struct StreamResponse {
|
pub(crate) struct StreamResponse {
|
||||||
pub index: u32,
|
pub index: u32,
|
||||||
pub token: Token,
|
pub token: Token,
|
||||||
|
@@ -533,7 +533,7 @@ async fn generate_stream_internal(
|
|||||||
} else {
|
} else {
|
||||||
match infer.generate_stream(req).instrument(info_span!(parent: &span, "async_stream")).await {
|
match infer.generate_stream(req).instrument(info_span!(parent: &span, "async_stream")).await {
|
||||||
// Keep permit as long as generate_stream lives
|
// Keep permit as long as generate_stream lives
|
||||||
Ok((_permit, input_length, mut response_stream)) => {
|
Ok((_permit, input_length, response_stream)) => {
|
||||||
let mut index = 0;
|
let mut index = 0;
|
||||||
let mut response_stream = Box::pin(response_stream);
|
let mut response_stream = Box::pin(response_stream);
|
||||||
// Server-Sent Event stream
|
// Server-Sent Event stream
|
||||||
|
Loading…
Reference in New Issue
Block a user