mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-12 04:44:52 +00:00
Important line got squashed.
This commit is contained in:
parent
aac91d1d26
commit
7b13fede50
@ -1520,6 +1520,10 @@ class FlashCausalLM(Model):
|
|||||||
)
|
)
|
||||||
# assert block_tables.shape[0] >= slots.shape[0]
|
# assert block_tables.shape[0] >= slots.shape[0]
|
||||||
cuda_graph["block_tables"][: block_tables.shape[0]] = block_tables
|
cuda_graph["block_tables"][: block_tables.shape[0]] = block_tables
|
||||||
|
else:
|
||||||
|
cuda_graph["block_tables"][
|
||||||
|
: block_tables.shape[0], : block_tables.shape[1]
|
||||||
|
] = block_tables
|
||||||
|
|
||||||
# XXX: This is working only because block 0 is reserved for the healthcheck
|
# XXX: This is working only because block 0 is reserved for the healthcheck
|
||||||
# so it doesn't matter if we override it with bogus values.
|
# so it doesn't matter if we override it with bogus values.
|
||||||
|
Loading…
Reference in New Issue
Block a user