mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-07-29 11:20:16 +00:00
fix: prefer default dtype
This commit is contained in:
parent
7ab99bc6b3
commit
eef3c7bdf2
@@ -1362,7 +1362,8 @@ def get_model(
|
||||
revision=revision,
|
||||
quantize=quantize,
|
||||
speculator=speculator,
|
||||
-dtype=torch.bfloat16,
|
||||
+dtype=dtype,
|
||||
+default_dtype=torch.bfloat16,
|
||||
kv_cache_dtype=kv_cache_dtype,
|
||||
trust_remote_code=trust_remote_code,
|
||||
lora_adapter_ids=lora_adapter_ids,
|
||||
|
Loading…
Reference in New Issue
Block a user