mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-21 06:42:10 +00:00
Update transformers_flash_causal_lm.py
This commit is contained in:
parent
de83178bc3
commit
bafbd06744
@ -110,7 +110,7 @@ transformers.models.cohere.configuration_cohere.CohereConfig.base_model_tp_plan
|
|||||||
"layers.*.mlp.up_proj": "colwise",
|
"layers.*.mlp.up_proj": "colwise",
|
||||||
"layers.*.mlp.down_proj": "rowwise",
|
"layers.*.mlp.down_proj": "rowwise",
|
||||||
}
|
}
|
||||||
transformers.models.cohere.configuration_cohere2.Cohere2Config.base_model_tp_plan = {
|
transformers.models.cohere2.configuration_cohere2.Cohere2Config.base_model_tp_plan = {
|
||||||
"layers.*.self_attn.q_proj": "colwise",
|
"layers.*.self_attn.q_proj": "colwise",
|
||||||
"layers.*.self_attn.k_proj": "colwise",
|
"layers.*.self_attn.k_proj": "colwise",
|
||||||
"layers.*.self_attn.v_proj": "colwise",
|
"layers.*.self_attn.v_proj": "colwise",
|
||||||
|
Loading…
Reference in New Issue
Block a user