mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-10 03:44:54 +00:00
add improvements
This commit is contained in:
parent
be8e60a918
commit
6ed540b52f
@@ -1346,6 +1346,9 @@ class FlashCausalLM(Model):
|
|||||||
def batch_type(self) -> Type[FlashCausalLMBatch]:
|
def batch_type(self) -> Type[FlashCausalLMBatch]:
|
||||||
return FlashCausalLMBatch
|
return FlashCausalLMBatch
|
||||||
|
|
||||||
|
def get_input_embeddings(self, batch):
|
||||||
|
batch.inputs_embeds = None
|
||||||
|
|
||||||
def init_kv_cache(
|
def init_kv_cache(
|
||||||
self,
|
self,
|
||||||
num_blocks: int,
|
num_blocks: int,
|
||||||
|
Loading…
Reference in New Issue
Block a user