Do not convert weight scale to e4m3fnuz on CUDA (#2917)

This commit is contained in:
Daniël de Kok 2025-01-16 13:44:32 +01:00 committed by GitHub
parent 922cc38fbc
commit 5f78ec32a5
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -147,7 +147,7 @@ class W8ANFpLoader(WeightsLoader):
else None
)
-if self.load_weight_scale or SYSTEM == "rocm":
+if self.load_weight_scale and SYSTEM == "rocm":
w, weight_scale, input_scale = normalize_e4m3fn_to_e4m3fnuz(
w, weight_scale, input_scale
)