mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-10 20:04:52 +00:00
fix drop
This commit is contained in:
parent
8ec0edcfe3
commit
3c4243d627
@ -640,6 +640,10 @@ class FlashCausalLMBatch(Batch):
|
|||||||
device=batches[0].next_token_chooser.device,
|
device=batches[0].next_token_chooser.device,
|
||||||
)
|
)
|
||||||
|
|
||||||
|
# Needed to avoid dropping blocks when the batches go out of scope
|
||||||
|
for b in batches:
|
||||||
|
b.block_tables = None
|
||||||
|
|
||||||
return FlashCausalLMBatch(
|
return FlashCausalLMBatch(
|
||||||
batch_id=batches[0].batch_id,
|
batch_id=batches[0].batch_id,
|
||||||
requests=requests,
|
requests=requests,
|
||||||
|
Loading…
Reference in New Issue
Block a user