mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-12 12:54:52 +00:00
Medusa requires reshaping.
This commit is contained in:
parent
99b6b5c795
commit
4fff77ebcb
@@ -1412,7 +1412,7 @@ class FlashCausalLM(Model):
|
|||||||
).view(-1)
|
).view(-1)
|
||||||
prefix_lens_tensor = (
|
prefix_lens_tensor = (
|
||||||
batch.prefix_lens_tensor.unsqueeze(-1).expand(B, new_length)
|
batch.prefix_lens_tensor.unsqueeze(-1).expand(B, new_length)
|
||||||
).view(-1)
|
).reshape(-1)
|
||||||
|
|
||||||
# Add Copy the block tables for all members
|
# Add Copy the block tables for all members
|
||||||
block_tables = (
|
block_tables = (
|
||||||
|
Loading…
Reference in New Issue
Block a user