mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 20:34:54 +00:00
Fix Phi-2 with tp>1
We were using the wrong parallelism in the up-projection: `fc1` was loaded with TensorParallelRowLinear instead of TensorParallelColumnLinear.
This commit is contained in:
parent
df71aafdcc
commit
f9c354d120
@@ -238,7 +238,7 @@ class PhiMLP(nn.Module):
|
|||||||
)
|
)
|
||||||
|
|
||||||
# llama weights are up_proj and down_proj and bias=False
|
# llama weights are up_proj and down_proj and bias=False
|
||||||
self.up_proj = TensorParallelRowLinear.load(
|
self.up_proj = TensorParallelColumnLinear.load(
|
||||||
config,
|
config,
|
||||||
prefix=f"{prefix}.fc1",
|
prefix=f"{prefix}.fc1",
|
||||||
weights=weights,
|
weights=weights,
|
||||||
|
Loading…
Reference in New Issue
Block a user