mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-10 20:04:52 +00:00
Fixing Idefics dtype.
This commit is contained in:
parent
861acdeab1
commit
a8da815b81
@@ -583,7 +583,7 @@ class IdeficsCausalLM(Model):
|
||||
|
||||
if torch.cuda.is_available():
|
||||
device = torch.device("cuda")
|
||||
- dtype = torch.float16 if dtype is None else dtype
|
||||
+ dtype = torch.bfloat16 if dtype is None else dtype
|
||||
else:
|
||||
if quantize:
|
||||
raise ValueError("quantization is not available on CPU")
|
||||
|
Loading…
Reference in New Issue
Block a user