Skip to content

Commit

Permalink
Add DeepseekV3 AutoTP. (deepspeedai#7045)
Browse files (browse the repository at this point in the history)
Add DeepseekV3 AutoTP.

Signed-off-by: Lai, Yejing <[email protected]>
Signed-off-by: gyou2021 <[email protected]>
  • Loading branch information
Yejing-Lai authored and gyou2021 committed Feb 28, 2025
1 parent 4cbc52c commit 586e436
Showing 1 changed file with 2 additions and 1 deletion.
3 changes: 2 additions & 1 deletion deepspeed/module_inject/auto_tp.py
Original file line number Diff line number Diff line change
Expand Up @@ -137,7 +137,8 @@ def is_load_module(module):
"LPLayerNorm", "SharedEmbedding", "OPTLearnedPositionalEmbedding", "LlamaRMSNorm", "FalconLinear",
"MistralRMSNorm", "T5LayerNorm", "MixtralRMSNorm", "Phi3RotaryEmbedding", "Phi3SuScaledRotaryEmbedding",
"Phi3RMSNorm", "YuanRMSNorm", "YuanRotaryEmbedding", "Phi3LongRoPEScaledRotaryEmbedding", "Qwen2RMSNorm",
"DeepseekV2RMSNorm", "DeepseekV2YarnRotaryEmbedding", "MoEGate"
"DeepseekV2RMSNorm", "DeepseekV3RMSNorm", "DeepseekV2YarnRotaryEmbedding", "DeepseekV3YarnRotaryEmbedding",
"MoEGate"
]
return module.__class__ in load_layers or module._get_name() in load_layer_names

Expand Down

0 comments on commit 586e436

Please sign in to comment.