From c0df99e704082749e47d5588a23e0f00f6529aae Mon Sep 17 00:00:00 2001 From: OlivierDehaene <23298448+OlivierDehaene@users.noreply.github.com> Date: Fri, 21 Apr 2023 19:48:41 +0200 Subject: [PATCH] fix(server): fix flash causal --- server/text_generation_server/models/flash_causal_lm.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/server/text_generation_server/models/flash_causal_lm.py b/server/text_generation_server/models/flash_causal_lm.py index c44dd57d..f332ab51 100644 --- a/server/text_generation_server/models/flash_causal_lm.py +++ b/server/text_generation_server/models/flash_causal_lm.py @@ -225,6 +225,7 @@ class FlashCausalLMBatch(Batch): return FlashCausalLMBatch( batch_id=self.batch_id, + past_pad=self.past_pad, requests=requests, requests_idx_mapping=requests_idx_mapping, input_ids=input_ids, @@ -311,6 +312,7 @@ class FlashCausalLMBatch(Batch): return FlashCausalLMBatch( batch_id=batches[0].batch_id, + past_pad=batches[0].past_pad, requests=requests, requests_idx_mapping=requests_idx_mapping, input_ids=input_ids,