From d99f281050e4d39ceff711b0b0cddeec32fada23 Mon Sep 17 00:00:00 2001
From: Nicolas Patry
Date: Mon, 4 Dec 2023 14:43:29 +0000
Subject: [PATCH] Remove pdb comments.

---
 .../text_generation_server/models/flash_causal_lm.py | 12 ------------
 server/text_generation_server/utils/tokens.py        |  2 --
 2 files changed, 14 deletions(-)

diff --git a/server/text_generation_server/models/flash_causal_lm.py b/server/text_generation_server/models/flash_causal_lm.py
index 952068ec..de946d21 100644
--- a/server/text_generation_server/models/flash_causal_lm.py
+++ b/server/text_generation_server/models/flash_causal_lm.py
@@ -825,8 +825,6 @@ class FlashCausalLM(Model):
 
         next_token_logits = out
 
-        # if next_token_logits.shape[0] == 3:
-        #     import ipdb;ipdb.set_trace()
         from text_generation_server.models import SPECULATE
         next_input_ids, next_token_logprobs, logprobs, accepted_ids, speculative_ids = batch.next_token_chooser(
             batch.all_input_ids_tensor[:, : batch.max_seqlen], next_token_logits, SPECULATE, batch.speculative_ids, speculative_logits
@@ -850,7 +848,6 @@ class FlashCausalLM(Model):
             batch.cu_seqlen_prefill = None
         else:
             prefill_logprobs = None
-            # import ipdb;ipdb.set_trace()
             next_position_ids = batch.position_ids
 
         # Cumulative length
@@ -912,15 +909,6 @@ class FlashCausalLM(Model):
 
             cumulative_length += input_length
 
-        # if accepted_ids[0] > 1:
-        #     import ipdb;ipdb.set_trace()
-
-        # if len(accepted_ids) > 1:
-        #     raise Exception("Implemtent the batched behavior")
-
-        # Set values in batch
-        # batch.input_ids = torch.cat([next_input_ids.unsqueeze(-1), speculative_ids], dim=1).view(-1)
-
         batch.input_ids = next_input_ids[accepted_ids.cumsum(dim=-1) - 1]
         batch.speculative_ids = speculative_ids
         batch.position_ids = next_position_ids + accepted_ids
diff --git a/server/text_generation_server/utils/tokens.py b/server/text_generation_server/utils/tokens.py
index 4c77b660..d5a703c8 100644
--- a/server/text_generation_server/utils/tokens.py
+++ b/server/text_generation_server/utils/tokens.py
@@ -308,8 +308,6 @@ class HeterogeneousNextTokenChooser:
                     break
 
                 accepted_ids.append(accepted)
-                from loguru import logger
-                logger.info(f"ACCEPTED IDS {accepted_ids}")
             accepted_ids = torch.tensor(accepted_ids, device=input_ids.device, dtype=input_ids.dtype)
             next_ids = next_ids[indices]
             scores = scores[indices]
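
Note: the line kept by the last flash_causal_lm.py hunk,
`batch.input_ids = next_input_ids[accepted_ids.cumsum(dim=-1) - 1]`, picks
the last accepted token of each sequence out of a packed tensor. A minimal
sketch of that indexing, assuming next_input_ids holds only the accepted
speculative tokens concatenated across the batch (as the per-sequence
accepted_ids bookkeeping in tokens.py suggests; the values below are
hypothetical):

    import torch

    # Hypothetical packed output of next_token_chooser: sequence 0 accepted
    # two tokens (11, 12) and sequence 1 accepted one token (21).
    next_input_ids = torch.tensor([11, 12, 21])
    accepted_ids = torch.tensor([2, 1])

    # cumsum(dim=-1) yields each sequence's end offset in the packed tensor,
    # [2, 3]; subtracting 1 indexes the last accepted token per sequence.
    batch_input_ids = next_input_ids[accepted_ids.cumsum(dim=-1) - 1]
    print(batch_input_ids)  # tensor([12, 21])

Each sequence thus contributes exactly one token (its last accepted one) as
input to the next forward pass, which is why the commented-out torch.cat
variant above it could be deleted.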