mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-08 19:04:52 +00:00
minor fix
Signed-off-by: Wang, Yi A <yi.a.wang@intel.com>
This commit is contained in:
parent
7c8694545f
commit
6382b4261c
@@ -51,9 +51,8 @@ class LoraLinear(nn.Module):
|
||||
return result
|
||||
data: Optional["BatchLoraWeights"] = adapter_data.data.get(layer_type)
|
||||
|
||||
if (
|
||||
data is not None
|
||||
and SYSTEM == "ipex"
|
||||
if data is not None and (
|
||||
SYSTEM == "ipex"
|
||||
or (punica_sgmv is not None and data.can_vectorize(self.process_group))
|
||||
):
|
||||
# In tensor-parallel configurations, each GPU processes a specific segment of the output.
|
||||
|
Loading…
Reference in New Issue
Block a user