mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-12 04:44:52 +00:00
Fix GPTQ autotune data type to be compatible with Torch 2.4.0
This commit is contained in:
parent
26614057a7
commit
fa9221f28d
@@ -91,7 +91,7 @@ class Autotuner(triton.KernelInterface):
|
||||
kernel_call, quantiles=(0.5, 0.2, 0.8), rep=40
|
||||
)
|
||||
except triton.OutOfResources:
|
||||
-return (float("inf"), float("inf"), float("inf"))
|
||||
+return [float("inf"), float("inf"), float("inf")]
|
||||
|
||||
def run(self, *args, **kwargs):
|
||||
self.nargs = dict(zip(self.arg_names, args))
|
||||
|
Loading…
Reference in New Issue
Block a user