Shorter diff.

This commit is contained in:
Nicolas Patry 2024-07-23 12:59:35 +00:00
parent ab62312d8c
commit 32cc60f329
No known key found for this signature in database
GPG Key ID: B154A218C20EBBCA

View File

@@ -120,7 +120,7 @@ class MistralAttention(torch.nn.Module):
if hasattr(config, "head_dim"): if hasattr(config, "head_dim"):
self.head_size = config.head_dim self.head_size = config.head_dim
else: else:
self.head_size = hidden_size // num_attention_heads self.head_size = self.hidden_size // self.num_heads
self.rotary_emb = PositionRotaryEmbedding.static( self.rotary_emb = PositionRotaryEmbedding.static(
config=config, config=config,