mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-05-01 23:12:09 +00:00
fix(server): Fix handling of non-parameter tensors in the quantize script
(`bigcode/starcoder` was an example). (#661)
This commit is contained in:
parent
362883f259
commit
08b8eec1d7
@ -812,10 +812,13 @@ def load_weights_pre_hook(module_name, weights, recursive=False):
|
|||||||
tensor = weights.get_tensor(tensor_name)
|
tensor = weights.get_tensor(tensor_name)
|
||||||
setdeepattr(module, local_param, nn.Parameter(tensor))
|
setdeepattr(module, local_param, nn.Parameter(tensor))
|
||||||
else:
|
else:
|
||||||
|
tensor = current_tensor.to(device=torch.device("cuda:0"))
|
||||||
|
if current_tensor.requires_grad:
|
||||||
|
tensor = nn.Parameter(tensor)
|
||||||
setdeepattr(
|
setdeepattr(
|
||||||
module,
|
module,
|
||||||
local_param,
|
local_param,
|
||||||
nn.Parameter(current_tensor.to(device=torch.device("cuda:0"))),
|
tensor
|
||||||
)
|
)
|
||||||
|
|
||||||
return inner
|
return inner
|
||||||
|
Loading…
Reference in New Issue
Block a user