mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-19 13:52:07 +00:00
flashinfer: head_dim -> head_dim_qk
This commit is contained in:
parent
e893362ad7
commit
3d71c06aff
@@ -90,7 +90,7 @@ def use_prefill_with_paged_kv_state(
|
||||
paged_kv_last_page_len=last_page_len,
|
||||
num_qo_heads=num_heads,
|
||||
num_kv_heads=num_kv_heads,
|
||||
-head_dim=head_size,
|
||||
+head_dim_qk=head_size,
|
||||
kv_data_type=kv_dtype,
|
||||
q_data_type=q_dtype,
|
||||
page_size=page_size,
|
||||
|
Loading…
Reference in New Issue
Block a user