mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 20:34:54 +00:00
Add a default value (`True`) for the `causal` parameter of `FlashGemmaAttention.__init__`.
This commit is contained in:
parent
fc5bfa070a
commit
425f348e48
@@ -162,7 +162,7 @@ def _load_gqa(config, prefix: str, weights):
 
 
 class FlashGemmaAttention(torch.nn.Module):
-    def __init__(self, prefix: str, config, weights, causal: bool):
+    def __init__(self, prefix: str, config, weights, causal: bool = True):
         super().__init__()
         self.num_heads = config.num_attention_heads
         self.head_size = config.head_dim
Loading…
Reference in New Issue
Block a user