mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-12 04:44:52 +00:00
revert default dtype
This commit is contained in:
parent
0d68619efa
commit
6d8e3659a9
@ -334,13 +334,6 @@ def get_model(
|
||||
if FBGEMM_DYN_AVAILABLE:
|
||||
# fbgemm kernels are fp8xfp8->bf16
|
||||
dtype = torch.bfloat16
|
||||
else:
|
||||
config_dtype = config_dict.get("torch_dtype", None)
|
||||
# Only use the config dtype if it's one of TGI's supported dtypes
|
||||
if config_dtype == "float16":
|
||||
dtype = torch.float16
|
||||
elif config_dtype == "bfloat16":
|
||||
dtype = torch.bfloat16
|
||||
else:
|
||||
# Keep it as default for now and let
|
||||
# every model resolve their own default dtype.
|
||||
|
Loading…
Reference in New Issue
Block a user