mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-10 11:54:52 +00:00
fix drop
This commit is contained in:
parent
8ec0edcfe3
commit
3c4243d627
@ -640,6 +640,10 @@ class FlashCausalLMBatch(Batch):
|
||||
device=batches[0].next_token_chooser.device,
|
||||
)
|
||||
|
||||
# Needed to avoid dropping blocks when the batches go out of scope
|
||||
for b in batches:
|
||||
b.block_tables = None
|
||||
|
||||
return FlashCausalLMBatch(
|
||||
batch_id=batches[0].batch_id,
|
||||
requests=requests,
|
||||
|
Loading…
Reference in New Issue
Block a user