Pass KV scales (k_scale/v_scale) in paged attention

Signed-off-by: Wang, Yi A <yi.a.wang@intel.com>
This commit is contained in:
Wang, Yi A 2025-04-07 22:47:11 -07:00
parent d9e47b651c
commit ad15a9c0af

View File

@@ -143,6 +143,8 @@ def paged_attention(
BLOCK_SIZE,
max_s,
None,
k_scale=kv_scales.key_scale_cpu,
v_scale=kv_scales.value_scale_cpu,
)
return out