mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-07-29 19:30:16 +00:00
fix: prefer default dtype
This commit is contained in:
parent
7ab99bc6b3
commit
eef3c7bdf2
@ -1362,7 +1362,8 @@ def get_model(
|
|||||||
revision=revision,
|
revision=revision,
|
||||||
quantize=quantize,
|
quantize=quantize,
|
||||||
speculator=speculator,
|
speculator=speculator,
|
||||||
dtype=torch.bfloat16,
|
dtype=dtype,
|
||||||
|
default_dtype=torch.bfloat16,
|
||||||
kv_cache_dtype=kv_cache_dtype,
|
kv_cache_dtype=kv_cache_dtype,
|
||||||
trust_remote_code=trust_remote_code,
|
trust_remote_code=trust_remote_code,
|
||||||
lora_adapter_ids=lora_adapter_ids,
|
lora_adapter_ids=lora_adapter_ids,
|
||||||
|
Loading…
Reference in New Issue
Block a user