fix: fix logic if sliding window key is not present in config (#1352)

This commit is contained in:
OlivierDehaene 2023-12-15 14:56:17 +01:00 committed by Karol Damaszke
parent a95e6d603d
commit ecb0db45af
2 changed files with 2 additions and 2 deletions

View File

@@ -60,7 +60,7 @@ class MistralConfig(PretrainedConfig):
pretraining_tp=1,
tie_word_embeddings=False,
rope_theta=10000.0,
-sliding_window=4096,
+sliding_window=None,
**kwargs,
):
self.vocab_size = vocab_size

View File

@@ -72,7 +72,7 @@ class MixtralConfig(PretrainedConfig):
pretraining_tp=1,
tie_word_embeddings=False,
rope_theta=10000.0,
-sliding_window=4096,
+sliding_window=None,
num_experts_per_tok=2,
num_local_experts=8,
**kwargs,