mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-19 22:02:06 +00:00
Update transformers_flash_causal_lm.py
This commit is contained in:
parent
de83178bc3
commit
bafbd06744
@@ -110,7 +110,7 @@ transformers.models.cohere.configuration_cohere.CohereConfig.base_model_tp_plan
|
||||
"layers.*.mlp.up_proj": "colwise",
|
||||
"layers.*.mlp.down_proj": "rowwise",
|
||||
}
|
||||
-transformers.models.cohere.configuration_cohere2.Cohere2Config.base_model_tp_plan = {
|
||||
+transformers.models.cohere2.configuration_cohere2.Cohere2Config.base_model_tp_plan = {
|
||||
"layers.*.self_attn.q_proj": "colwise",
|
||||
"layers.*.self_attn.k_proj": "colwise",
|
||||
"layers.*.self_attn.v_proj": "colwise",
|
||||
|
Loading…
Reference in New Issue
Block a user