Attempt to fix torch memory leak: call torch.cuda.empty_cache() when all generations in the batch have finished.

2025-09-17 23:34:52 +00:00 · 2023-08-12 09:06:49 +02:00 · 2023-08-12 09:06:49 +02:00 · 89a4e723d2
commit 89a4e723d2
parent a2a913eec5
1 changed file with 1 addition and 0 deletions
--- a/server/text_generation_server/models/causal_lm.py
+++ b/server/text_generation_server/models/causal_lm.py
@@ -659,6 +659,7 @@ class CausalLM(Model):

        # We finished all generations in the batch; there is no next batch
        if stopped:
+            torch.cuda.empty_cache()
            return generations, None

        # Slice unused values from prefill