add improvements

This commit is contained in:
Mohit Sharma 2025-04-21 15:28:18 +00:00
parent be8e60a918
commit 6ed540b52f

View File

@@ -1346,6 +1346,9 @@ class FlashCausalLM(Model):
# Return the batch class used with this model: FlashCausalLMBatch.
# The class object itself is returned, not an instance of it.
# NOTE(review): indentation (and any decorator preceding this line) is not
# visible in this diff view -- confirm against the full file.
def batch_type(self) -> Type[FlashCausalLMBatch]:
return FlashCausalLMBatch
# Set `batch.inputs_embeds` to None in place; nothing is returned.
# NOTE(review): presumably a default hook that subclasses which compute real
# input embeddings override -- confirm against callers and subclasses.
def get_input_embeddings(self, batch):
# Mutates the batch object passed in by the caller.
batch.inputs_embeds = None
def init_kv_cache(
self,
num_blocks: int,