mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-21 23:12:07 +00:00
disable _custom_C.LLMM1 as it is broken for TP>=2
This commit is contained in:
parent
562cd4b06e
commit
81c27ba9c2
@@ -355,7 +355,8 @@ class FastLinearROCm(nn.Module):
|
|||||||
weight = self.weight
|
weight = self.weight
|
||||||
bias = self.bias
|
bias = self.bias
|
||||||
|
|
||||||
if IS_ROCM_SYSTEM and inp.numel() // inp.size(-1) == 1:
|
# TODO: fix for TP>=2, this only works for TP=1
|
||||||
|
if False and IS_ROCM_SYSTEM and inp.numel() // inp.size(-1) == 1:
|
||||||
batched = False
|
batched = False
|
||||||
|
|
||||||
if inp.dim() == 3:
|
if inp.dim() == 3:
|
||||||
|
Loading…
Reference in New Issue
Block a user