From ca73b60da74e3b3a416d861dfd69dda9c36c165d Mon Sep 17 00:00:00 2001
From: OlivierDehaene <23298448+OlivierDehaene@users.noreply.github.com>
Date: Mon, 13 Feb 2023 12:46:39 +0100
Subject: [PATCH] remove max sequence length

---
 router/client/src/client.rs         | 4 ++--
 router/client/src/sharded_client.rs | 4 ++--
 2 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/router/client/src/client.rs b/router/client/src/client.rs
index 9620cf70..1f0d23f2 100644
--- a/router/client/src/client.rs
+++ b/router/client/src/client.rs
@@ -66,7 +66,7 @@ impl Client {
     ///
     /// Returns Generation for each request in batch
     /// and the next cached batch
-    #[instrument(skip_all, fields(id = &batch.id, size = &batch.size, max_sequence_length = batch.requests.iter().map(|request| request.input_length).max()))]
+    #[instrument(skip_all, fields(id = &batch.id, size = &batch.size))]
     pub async fn prefill(&mut self, batch: Batch) -> Result<(Vec<Generation>, Option<Batch>)> {
         let request = tonic::Request::new(PrefillRequest { batch: Some(batch) }).inject_context();
         let response = self.stub.prefill(request).await?.into_inner();
@@ -77,7 +77,7 @@ impl Client {
     ///
     /// Returns Generation for each request in batches
     /// and the next cached batch
-    #[instrument(skip_all, fields(size = batches.iter().map(|batch|{batch.size}).sum::<u32>(), max_sequence_length = batches.iter().map(|batch|{batch.requests.iter().map(|request| request.input_length).max()}).max()))]
+    #[instrument(skip_all, fields(size = batches.iter().map(|batch|{batch.size}).sum::<u32>()))]
     pub async fn decode(
         &mut self,
         batches: Vec<Batch>,
diff --git a/router/client/src/sharded_client.rs b/router/client/src/sharded_client.rs
index 3f1cd4ab..2e662ca3 100644
--- a/router/client/src/sharded_client.rs
+++ b/router/client/src/sharded_client.rs
@@ -53,7 +53,7 @@ impl ShardedClient {
     ///
     /// Returns Generation for each request in batch
     /// and the next cached batch
-    #[instrument(skip_all, fields(id = &batch.id, size = &batch.size, max_sequence_length = batch.requests.iter().map(|request| request.input_length).max()))]
+    #[instrument(skip_all, fields(id = &batch.id, size = &batch.size))]
     pub async fn prefill(&mut self, batch: Batch) -> Result<(Vec<Generation>, Option<Batch>)> {
         let futures: Vec<_> = self
             .clients
@@ -69,7 +69,7 @@ impl ShardedClient {
     ///
     /// Returns Generation for each request in batches
     /// and the next cached batch
-    #[instrument(skip_all, fields(size = batches.iter().map(|batch|{batch.size}).sum::<u32>(), max_sequence_length = batches.iter().map(|batch|{batch.requests.iter().map(|request| request.input_length).max()}).max()))]
+    #[instrument(skip_all, fields(size = batches.iter().map(|batch|{batch.size}).sum::<u32>()))]
     pub async fn decode(
         &mut self,
         batches: Vec<Batch>,