mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-09 19:34:53 +00:00
minor fix
Signed-off-by: Wang, Yi A <yi.a.wang@intel.com>
This commit is contained in:
parent
7c8694545f
commit
6382b4261c
@@ -51,9 +51,8 @@ class LoraLinear(nn.Module):
|
|||||||
return result
|
return result
|
||||||
data: Optional["BatchLoraWeights"] = adapter_data.data.get(layer_type)
|
data: Optional["BatchLoraWeights"] = adapter_data.data.get(layer_type)
|
||||||
|
|
||||||
if (
|
if data is not None and (
|
||||||
data is not None
|
SYSTEM == "ipex"
|
||||||
and SYSTEM == "ipex"
|
|
||||||
or (punica_sgmv is not None and data.can_vectorize(self.process_group))
|
or (punica_sgmv is not None and data.can_vectorize(self.process_group))
|
||||||
):
|
):
|
||||||
# In tensor-parallel configurations, each GPU processes a specific segment of the output.
|
# In tensor-parallel configurations, each GPU processes a specific segment of the output.
|
||||||
|
Loading…
Reference in New Issue
Block a user