Skip to content

Commit 91d05e2

Browse files
Yejing-Lai and shenzheyu
authored and committed
Add DeepseekV3 AutoTP. (#7045)
Add deepseekv3 autotp. Signed-off-by: Lai, Yejing <[email protected]> Signed-off-by: Zheyu SHEN <[email protected]>
1 parent dddc7cf commit 91d05e2

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

deepspeed/module_inject/auto_tp.py

+2 -1
Original file line numberDiff line numberDiff line change
@@ -137,7 +137,8 @@ def is_load_module(module):
137 137
"LPLayerNorm", "SharedEmbedding", "OPTLearnedPositionalEmbedding", "LlamaRMSNorm", "FalconLinear",
138 138
"MistralRMSNorm", "T5LayerNorm", "MixtralRMSNorm", "Phi3RotaryEmbedding", "Phi3SuScaledRotaryEmbedding",
139 139
"Phi3RMSNorm", "YuanRMSNorm", "YuanRotaryEmbedding", "Phi3LongRoPEScaledRotaryEmbedding", "Qwen2RMSNorm",
140 -
"DeepseekV2RMSNorm", "DeepseekV2YarnRotaryEmbedding", "MoEGate"
140 +
"DeepseekV2RMSNorm", "DeepseekV3RMSNorm", "DeepseekV2YarnRotaryEmbedding", "DeepseekV3YarnRotaryEmbedding",
141 +
"MoEGate"
141 142
]
142 143
return module.__class__ in load_layers or module._get_name() in load_layer_names
143 144

0 commit comments

Comments
 (0)