mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 04:14:52 +00:00
rebase
This commit is contained in:
parent
66238a1c94
commit
e55870b03e
@ -152,7 +152,6 @@ def get_model(
|
|||||||
use_medusa = None
|
use_medusa = None
|
||||||
if "medusa_num_heads" in config_dict:
|
if "medusa_num_heads" in config_dict:
|
||||||
use_medusa = model_id
|
use_medusa = model_id
|
||||||
medusa_config = config_dict
|
|
||||||
model_id = config_dict["base_model_name_or_path"]
|
model_id = config_dict["base_model_name_or_path"]
|
||||||
revision = "main"
|
revision = "main"
|
||||||
speculate_medusa = config_dict["medusa_num_heads"]
|
speculate_medusa = config_dict["medusa_num_heads"]
|
||||||
@ -298,7 +297,6 @@ def get_model(
|
|||||||
if MISTRAL:
|
if MISTRAL:
|
||||||
return FlashMistral(
|
return FlashMistral(
|
||||||
model_id,
|
model_id,
|
||||||
config_dict.get("architectures", []),
|
|
||||||
revision,
|
revision,
|
||||||
quantize=quantize,
|
quantize=quantize,
|
||||||
dtype=dtype,
|
dtype=dtype,
|
||||||
|
Loading…
Reference in New Issue
Block a user