mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 20:34:54 +00:00
cast to int32
This commit is contained in:
parent
ea66379e3c
commit
d1e95ceaff
@ -945,7 +945,7 @@ class FlashCausalLMBatch(Batch):
|
||||
)
|
||||
self.cu_seqlen_prefill = torch.nn.functional.pad(
|
||||
torch.cumsum(self.input_lengths_tensor, dim=0), (1, 0)
|
||||
)
|
||||
).to(torch.int32)
|
||||
self.cache_lengths_tensor = torch.tensor(
|
||||
self.cache_lengths, dtype=torch.int32, device=device
|
||||
)
|
||||
|
Loading…
Reference in New Issue
Block a user