mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-21 14:52:20 +00:00
Neox.
This commit is contained in:
parent
3fb8979a6d
commit
dadbbc27d5
@ -58,7 +58,7 @@ def load_row(config, prefix: str, weights, bias: bool):
|
||||
|
||||
|
||||
def load_qkv(config, prefix: str, weights, num_heads, head_size, hidden_size):
|
||||
weight = weights.get_multi_weights_col([prefix], quantize=config.quantize)
|
||||
weight = weights.get_multi_weights_col([prefix], quantize=config.quantize, dim=0)
|
||||
if isinstance(weight, torch.Tensor):
|
||||
# Only on non quantized versions
|
||||
weight = (
|
||||
|
Loading…
Reference in New Issue
Block a user