mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-24 16:32:12 +00:00
fix: slice stopping criteria buffer
This commit is contained in:
parent
b3c2d7291e
commit
04dbf7a506
@ -109,7 +109,7 @@ class StoppingCriteria:
|
||||
self.stop_sequence_criterias = stop_sequence_criterias
|
||||
self.max_new_tokens = max_new_tokens
|
||||
self.current_tokens = 0
|
||||
self.current_output = ""
|
||||
self.current_output = "test"
|
||||
self.ignore_eos_token = ignore_eos_token
|
||||
|
||||
def __call__(self, last_token: int, last_output: str) -> Tuple[bool, Optional[str]]:
|
||||
@ -121,6 +121,10 @@ class StoppingCriteria:
|
||||
return True, FinishReason.FINISH_REASON_EOS_TOKEN
|
||||
|
||||
self.current_output += last_output
|
||||
# There is no need to keep an output that is too long
|
||||
if len(self.current_output) > 300:
|
||||
# Slice to -200 to avoid doing it all the time
|
||||
self.current_output = self.current_output[-200:]
|
||||
for stop_sequence_criteria in self.stop_sequence_criterias:
|
||||
if stop_sequence_criteria(self.current_output):
|
||||
return True, FinishReason.FINISH_REASON_STOP_SEQUENCE
|
||||
|
Loading…
Reference in New Issue
Block a user