mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-22 23:42:06 +00:00
fix: fix logic if sliding window key is not present in config (#1352)
This commit is contained in:
parent
a95e6d603d
commit
ecb0db45af
@@ -60,7 +60,7 @@ class MistralConfig(PretrainedConfig):
|
|||||||
pretraining_tp=1,
|
pretraining_tp=1,
|
||||||
tie_word_embeddings=False,
|
tie_word_embeddings=False,
|
||||||
rope_theta=10000.0,
|
rope_theta=10000.0,
|
||||||
sliding_window=4096,
|
sliding_window=None,
|
||||||
**kwargs,
|
**kwargs,
|
||||||
):
|
):
|
||||||
self.vocab_size = vocab_size
|
self.vocab_size = vocab_size
|
||||||
|
@@ -72,7 +72,7 @@ class MixtralConfig(PretrainedConfig):
|
|||||||
pretraining_tp=1,
|
pretraining_tp=1,
|
||||||
tie_word_embeddings=False,
|
tie_word_embeddings=False,
|
||||||
rope_theta=10000.0,
|
rope_theta=10000.0,
|
||||||
sliding_window=4096,
|
sliding_window=None,
|
||||||
num_experts_per_tok=2,
|
num_experts_per_tok=2,
|
||||||
num_local_experts=8,
|
num_local_experts=8,
|
||||||
**kwargs,
|
**kwargs,
|
||||||
|
Loading…
Reference in New Issue
Block a user