mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-12 04:44:52 +00:00
Medusa requires reshaping.
This commit is contained in:
parent
99b6b5c795
commit
4fff77ebcb
@@ -1412,7 +1412,7 @@ class FlashCausalLM(Model):
|
||||
).view(-1)
|
||||
prefix_lens_tensor = (
|
||||
batch.prefix_lens_tensor.unsqueeze(-1).expand(B, new_length)
|
||||
- ).view(-1)
|
||||
+ ).reshape(-1)
|
||||
|
||||
# Add Copy the block tables for all members
|
||||
block_tables = (
|
||||
|
Loading…
Reference in New Issue
Block a user