This commit is contained in:
OlivierDehaene 2023-06-30 16:52:25 +02:00
parent 8ec0edcfe3
commit 3c4243d627

View File

@ -640,6 +640,10 @@ class FlashCausalLMBatch(Batch):
device=batches[0].next_token_chooser.device, device=batches[0].next_token_chooser.device,
) )
# Needed to avoid dropping blocks when the batches go out of scope
for b in batches:
b.block_tables = None
return FlashCausalLMBatch( return FlashCausalLMBatch(
batch_id=batches[0].batch_id, batch_id=batches[0].batch_id,
requests=requests, requests=requests,