mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-21 23:12:07 +00:00
Do not convert weight scale to e4m3fnuz on CUDA (#2917)
This commit is contained in:
parent
922cc38fbc
commit
5f78ec32a5
@@ -147,7 +147,7 @@ class W8ANFpLoader(WeightsLoader):
|
|||||||
else None
|
else None
|
||||||
)
|
)
|
||||||
|
|
||||||
if self.load_weight_scale or SYSTEM == "rocm":
|
if self.load_weight_scale and SYSTEM == "rocm":
|
||||||
w, weight_scale, input_scale = normalize_e4m3fn_to_e4m3fnuz(
|
w, weight_scale, input_scale = normalize_e4m3fn_to_e4m3fnuz(
|
||||||
w, weight_scale, input_scale
|
w, weight_scale, input_scale
|
||||||
)
|
)
|
||||||
|
Loading…
Reference in New Issue
Block a user