diff --git a/router/src/server.rs b/router/src/server.rs index b8c67b2c4..dd8bc8741 100644 --- a/router/src/server.rs +++ b/router/src/server.rs @@ -351,6 +351,7 @@ async fn generate_stream( "x-compute-characters", compute_characters.to_string().parse().unwrap(), ); + headers.insert("X-Accel-Buffering", "no".parse().unwrap()); let stream = async_stream::stream! { // Inference