fix logits processor

2025-09-11 12:24:53 +00:00 · 2024-02-08 12:49:24 +01:00 · 2024-02-08 12:49:24 +01:00 · cfacf91af8
commit cfacf91af8
parent 75b492d720
1 changed files with 2 additions and 2 deletions
--- a/server/text_generation_server/utils/logits_process.py
+++ b/server/text_generation_server/utils/logits_process.py
@@ -136,10 +136,10 @@ class FrequencyPenaltyLogitsProcessor(LogitsProcessor):
        score = torch.gather(scores, 1, input_ids)
        # if score < 0 then penalty has to be multiplied to reduce the previous token probability
        score = -torch.where(
-            score < 0, score * self.penalty_tensor, score / self.penalty_tensor
+            score < 0, score * self.penalty, score / self.penalty
        )
-        return scores - torch.scatter(scores, 1, input_ids, score)
+        return scores.scatter_add_(1, input_ids, score)
 class HeterogeneousFrequencyPenaltyLogitsProcessor(LogitsProcessor):