Do not convert weight scale to e4m3fnuz on CUDA

This commit is contained in:
Daniël de Kok 2025-01-16 11:06:11 +00:00
parent 922cc38fbc
commit f951a8b48d

View File

@@ -147,7 +147,7 @@ class W8ANFpLoader(WeightsLoader):
else None else None
) )
if self.load_weight_scale or SYSTEM == "rocm": if self.load_weight_scale and SYSTEM == "rocm":
w, weight_scale, input_scale = normalize_e4m3fn_to_e4m3fnuz( w, weight_scale, input_scale = normalize_e4m3fn_to_e4m3fnuz(
w, weight_scale, input_scale w, weight_scale, input_scale
) )