mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 20:34:54 +00:00
fix kernel
This commit is contained in:
parent
d1e95ceaff
commit
347f3f51da
@@ -229,11 +229,7 @@ def triton_copy_next_input_ids_inplace(
|
||||
|
||||
# Store in all_input_ids, since it is a 2D tensor, apply stride * bid
|
||||
tl.store(
|
||||
all_input_ids_ptr
|
||||
+ stride_all_input_ids * bid
|
||||
+ cache_length
|
||||
+ input_length
|
||||
+ block_arange,
|
||||
all_input_ids_ptr + stride_all_input_ids * bid + cache_length + block_arange,
|
||||
next_input_ids,
|
||||
mask=mask,
|
||||
)
|
||||
|
Loading…
Reference in New Issue
Block a user