mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 20:34:54 +00:00
Fix Phi-2 with tp>1
We were using the wrong parallelism in the up-projection.
This commit is contained in:
parent
df71aafdcc
commit
f9c354d120
@@ -238,7 +238,7 @@ class PhiMLP(nn.Module):
|
||||
)
|
||||
|
||||
# llama weights are up_proj and down_proj and bias=False
|
||||
- self.up_proj = TensorParallelRowLinear.load(
|
||||
+ self.up_proj = TensorParallelColumnLinear.load(
|
||||
config,
|
||||
prefix=f"{prefix}.fc1",
|
||||
weights=weights,
|
||||
|
Loading…
Reference in New Issue
Block a user