mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 20:34:54 +00:00
fix kernel
This commit is contained in:
parent
d1e95ceaff
commit
347f3f51da
@@ -229,11 +229,7 @@ def triton_copy_next_input_ids_inplace(
 
     # Store in all_input_ids, since it is a 2D tensor, apply stride * bid
     tl.store(
-        all_input_ids_ptr
-        + stride_all_input_ids * bid
-        + cache_length
-        + input_length
-        + block_arange,
+        all_input_ids_ptr + stride_all_input_ids * bid + cache_length + block_arange,
         next_input_ids,
         mask=mask,
     )
Loading…
Reference in New Issue
Block a user