From 783bc64f4799bab77ee24f1c72d5a674dc1551c0 Mon Sep 17 00:00:00 2001
From: OlivierDehaene <23298448+OlivierDehaene@users.noreply.github.com>
Date: Tue, 4 Apr 2023 18:54:10 +0200
Subject: [PATCH] fix concatenate

---
 server/text_generation_server/models/flash_causal_lm.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/server/text_generation_server/models/flash_causal_lm.py b/server/text_generation_server/models/flash_causal_lm.py
index ef28ac4d..5f0e46da 100644
--- a/server/text_generation_server/models/flash_causal_lm.py
+++ b/server/text_generation_server/models/flash_causal_lm.py
@@ -188,6 +188,7 @@ class FlashCausalLMBatch(Batch):
             max_seqlen=max_seqlen,
             past_key_values=past_key_values,
             input_lengths=input_lengths,
+            offsets=offsets,
             all_input_ids=all_input_ids,
             all_input_ids_tensor=all_input_ids_tensor,
             next_token_choosers=next_token_choosers,
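
The hunk above forwards the collected `offsets` list into the batch that `concatenate` rebuilds, alongside the other per-request fields. Below is a minimal, self-contained sketch of that pattern, not the actual TGI implementation: `ToyBatch` and everything except the field names shown in the diff (`input_lengths`, `offsets`, `all_input_ids`) are hypothetical stand-ins for `FlashCausalLMBatch`.

# Sketch (assumptions: ToyBatch is a stand-in for FlashCausalLMBatch;
# field names other than those in the diff are illustrative only).
from dataclasses import dataclass
from typing import List, Optional


@dataclass
class ToyBatch:
    input_lengths: List[int]
    offsets: List[Optional[int]]
    all_input_ids: List[List[int]]

    @classmethod
    def concatenate(cls, batches: List["ToyBatch"]) -> "ToyBatch":
        # Merge the per-request lists from every incoming batch.
        input_lengths: List[int] = []
        offsets: List[Optional[int]] = []
        all_input_ids: List[List[int]] = []
        for batch in batches:
            input_lengths.extend(batch.input_lengths)
            offsets.extend(batch.offsets)
            all_input_ids.extend(batch.all_input_ids)
        # The patch adds the equivalent of `offsets=offsets` to this call.
        # In this toy, omitting it would raise a TypeError because the
        # field is a required constructor argument.
        return cls(
            input_lengths=input_lengths,
            offsets=offsets,
            all_input_ids=all_input_ids,
        )


merged = ToyBatch.concatenate(
    [
        ToyBatch(input_lengths=[3], offsets=[None], all_input_ids=[[1, 2, 3]]),
        ToyBatch(input_lengths=[2], offsets=[None], all_input_ids=[[4, 5]]),
    ]
)
assert merged.offsets == [None, None]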