mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-19 13:52:07 +00:00
Fix state.plan call to use positional arguments
This commit is contained in:
parent
9a8d0462e1
commit
fd92054e1d
@@ -84,16 +84,16 @@ def use_prefill_with_paged_kv_state(
|
|||||||
token = prefill_with_paged_kv_state.set(state)
|
token = prefill_with_paged_kv_state.set(state)
|
||||||
try:
|
try:
|
||||||
state.plan(
|
state.plan(
|
||||||
qo_indptr=cu_seqlens,
|
cu_seqlens,
|
||||||
paged_kv_indptr=indptr,
|
indptr,
|
||||||
paged_kv_indices=block_tables,
|
block_tables,
|
||||||
paged_kv_last_page_len=last_page_len,
|
last_page_len,
|
||||||
num_qo_heads=num_heads,
|
num_heads,
|
||||||
num_kv_heads=num_kv_heads,
|
num_kv_heads,
|
||||||
head_dim=head_size,
|
head_size,
|
||||||
kv_data_type=kv_dtype,
|
page_size,
|
||||||
q_data_type=q_dtype,
|
q_data_type=q_dtype,
|
||||||
page_size=page_size,
|
kv_data_type=kv_dtype,
|
||||||
)
|
)
|
||||||
yield
|
yield
|
||||||
finally:
|
finally:
|
||||||
|
Loading…
Reference in New Issue
Block a user