mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-06-19 15:52:08 +00:00
Black
This commit is contained in:
parent
9dbaa176fd
commit
1acc96c82a
@ -1798,7 +1798,9 @@ class FlashCausalLM(Model):
|
|||||||
total_batch_seq = 0.001
|
total_batch_seq = 0.001
|
||||||
total_mem = 0
|
total_mem = 0
|
||||||
available_mem = free_mem - self.mem_reserved
|
available_mem = free_mem - self.mem_reserved
|
||||||
log_master(logger.info, f"Decode batch size list:{[bsz[0] for bsz in buckets]}\n")
|
log_master(
|
||||||
|
logger.info, f"Decode batch size list:{[bsz[0] for bsz in buckets]}\n"
|
||||||
|
)
|
||||||
for i, (batch_size, block_num) in enumerate(buckets):
|
for i, (batch_size, block_num) in enumerate(buckets):
|
||||||
if batch_size > block_num:
|
if batch_size > block_num:
|
||||||
continue
|
continue
|
||||||
|
@ -822,7 +822,9 @@ class FlashVlmCausalLM(FlashCausalLM):
|
|||||||
total_batch_seq = 0.001
|
total_batch_seq = 0.001
|
||||||
total_mem = 0
|
total_mem = 0
|
||||||
available_mem = decode_available_memory
|
available_mem = decode_available_memory
|
||||||
log_master(logger.info, f"Decode batch size list:{[bsz[0] for bsz in buckets]}\n")
|
log_master(
|
||||||
|
logger.info, f"Decode batch size list:{[bsz[0] for bsz in buckets]}\n"
|
||||||
|
)
|
||||||
for i, (batch_size, block_num) in enumerate(buckets):
|
for i, (batch_size, block_num) in enumerate(buckets):
|
||||||
if batch_size > block_num:
|
if batch_size > block_num:
|
||||||
continue
|
continue
|
||||||
|
@ -442,7 +442,9 @@ class FlashMllamaCausalLM(FlashVlmCausalLM):
|
|||||||
total_batch_seq = 0.001
|
total_batch_seq = 0.001
|
||||||
total_mem = 0
|
total_mem = 0
|
||||||
available_mem = free_mem - self.mem_reserved
|
available_mem = free_mem - self.mem_reserved
|
||||||
log_master(logger.info, f"Decode batch size list:{[bsz[0] for bsz in buckets]}\n")
|
log_master(
|
||||||
|
logger.info, f"Decode batch size list:{[bsz[0] for bsz in buckets]}\n"
|
||||||
|
)
|
||||||
for i, (batch_size, block_num) in enumerate(buckets):
|
for i, (batch_size, block_num) in enumerate(buckets):
|
||||||
if batch_size > block_num:
|
if batch_size > block_num:
|
||||||
continue
|
continue
|
||||||
|
@ -8,7 +8,7 @@ import torch
|
|||||||
|
|
||||||
|
|
||||||
def find_segments(
|
def find_segments(
|
||||||
adapter_indices: Union[torch.Tensor, List[int]]
|
adapter_indices: Union[torch.Tensor, List[int]],
|
||||||
) -> Tuple[List[int], List[int]]:
|
) -> Tuple[List[int], List[int]]:
|
||||||
segments = [0]
|
segments = [0]
|
||||||
segment_indices = []
|
segment_indices = []
|
||||||
|
Loading…
Reference in New Issue
Block a user