mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 20:34:54 +00:00
cast to int32
This commit is contained in:
parent
ea66379e3c
commit
d1e95ceaff
@@ -945,7 +945,7 @@ class FlashCausalLMBatch(Batch):
|
|||||||
)
|
)
|
||||||
self.cu_seqlen_prefill = torch.nn.functional.pad(
|
self.cu_seqlen_prefill = torch.nn.functional.pad(
|
||||||
torch.cumsum(self.input_lengths_tensor, dim=0), (1, 0)
|
torch.cumsum(self.input_lengths_tensor, dim=0), (1, 0)
|
||||||
)
|
).to(torch.int32)
|
||||||
self.cache_lengths_tensor = torch.tensor(
|
self.cache_lengths_tensor = torch.tensor(
|
||||||
self.cache_lengths, dtype=torch.int32, device=device
|
self.cache_lengths, dtype=torch.int32, device=device
|
||||||
)
|
)
|
||||||
|
Loading…
Reference in New Issue
Block a user