mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-21 23:12:07 +00:00
disable _custom_C.LLMM1 as it is broken for TP>=2
This commit is contained in:
parent
562cd4b06e
commit
81c27ba9c2
@@ -355,7 +355,8 @@ class FastLinearROCm(nn.Module):
|
||||
weight = self.weight
|
||||
bias = self.bias
|
||||
|
||||
if IS_ROCM_SYSTEM and inp.numel() // inp.size(-1) == 1:
|
||||
# TODO: fix for TP>=2, this only works for TP=1
|
||||
if False and IS_ROCM_SYSTEM and inp.numel() // inp.size(-1) == 1:
|
||||
batched = False
|
||||
|
||||
if inp.dim() == 3:
|
||||
|
Loading…
Reference in New Issue
Block a user